/*
 * Copyright (C) Sistina Software, Inc. 1997-2003 All rights reserved.
 * Copyright (C) 2004-2008 Red Hat, Inc. All rights reserved.
 *
 * This copyrighted material is made available to anyone wishing to use,
 * modify, copy, or redistribute it subject to the terms and conditions
 * of the GNU General Public License version 2.
 */

#include <linux/sched.h>
#include <linux/slab.h>
#include <linux/spinlock.h>
#include <linux/buffer_head.h>
#include <linux/delay.h>
#include <linux/sort.h>
#include <linux/jhash.h>
#include <linux/kallsyms.h>
#include <linux/gfs2_ondisk.h>
#include <linux/list.h>
#include <linux/wait.h>
#include <linux/module.h>
#include <asm/uaccess.h>
#include <linux/seq_file.h>
#include <linux/debugfs.h>
#include <linux/kthread.h>
#include <linux/freezer.h>
#include <linux/workqueue.h>
#include <linux/jiffies.h>
#include <linux/rcupdate.h>
#include <linux/rculist_bl.h>
#include <linux/bit_spinlock.h>
#include <linux/percpu.h>

#include "gfs2.h"
#include "incore.h"
#include "glock.h"
#include "glops.h"
#include "inode.h"
#include "lops.h"
#include "meta_io.h"
#include "quota.h"
#include "super.h"
#include "util.h"
#include "bmap.h"
#define CREATE_TRACE_POINTS
#include "trace_gfs2.h"

struct gfs2_glock_iter {
	int hash;			/* hash bucket index           */
	unsigned nhash;			/* Index within current bucket */
	struct gfs2_sbd *sdp;		/* incore superblock           */
	struct gfs2_glock *gl;		/* current glock struct        */
	loff_t last_pos;		/* last position               */
	char string[512];		/* scratch space               */
};

typedef void (*glock_examiner) (struct gfs2_glock * gl);

static int __dump_glock(struct seq_file *seq, const struct gfs2_glock *gl);
#define GLOCK_BUG_ON(gl,x) do { if (unlikely(x)) { __dump_glock(NULL, gl); BUG(); } } while(0)
static void do_xmote(struct gfs2_glock *gl, struct gfs2_holder *gh, unsigned int target);

static struct dentry *gfs2_root;
static struct workqueue_struct *glock_workqueue;
struct workqueue_struct *gfs2_delete_workqueue;
static LIST_HEAD(lru_list);
static atomic_t lru_count = ATOMIC_INIT(0);
static DEFINE_SPINLOCK(lru_lock);

#define GFS2_GL_HASH_SHIFT	15
#define GFS2_GL_HASH_SIZE	(1 << GFS2_GL_HASH_SHIFT)
#define GFS2_GL_HASH_MASK	(GFS2_GL_HASH_SIZE - 1)

static struct hlist_bl_head gl_hash_table[GFS2_GL_HASH_SIZE];

/**
 * gl_hash() - Turn glock number into hash bucket number
 * @sdp: The superblock
 * @name: The lock name
 *
 * Returns: The number of the corresponding hash bucket
 */

static unsigned int gl_hash(const struct gfs2_sbd *sdp,
			    const struct lm_lockname *name)
{
	unsigned int h;

	h = jhash(&name->ln_number, sizeof(u64), 0);
	h = jhash(&name->ln_type, sizeof(unsigned int), h);
	h = jhash(&sdp, sizeof(struct gfs2_sbd *), h);
	h &= GFS2_GL_HASH_MASK;

	return h;
}
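
/*
 * Illustrative note (not part of the original file): the bucket index
 * mixes the lock number, the lock type and the superblock pointer, so
 * the same block number used by two mounts, or by two lock types, will
 * usually land in different buckets. A sketch of the lookup key:
 *
 *	struct lm_lockname name = { .ln_number = 1234,
 *				    .ln_type = LM_TYPE_INODE };
 *	unsigned int bucket = gl_hash(sdp, &name); // 0..GFS2_GL_HASH_SIZE-1
 */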

static inline void spin_lock_bucket(unsigned int hash)
{
	hlist_bl_lock(&gl_hash_table[hash]);
}

static inline void spin_unlock_bucket(unsigned int hash)
{
	hlist_bl_unlock(&gl_hash_table[hash]);
}

static void gfs2_glock_dealloc(struct rcu_head *rcu)
{
	struct gfs2_glock *gl = container_of(rcu, struct gfs2_glock, gl_rcu);

	if (gl->gl_ops->go_flags & GLOF_ASPACE)
		kmem_cache_free(gfs2_glock_aspace_cachep, gl);
	else
		kmem_cache_free(gfs2_glock_cachep, gl);
}

void gfs2_glock_free(struct gfs2_glock *gl)
{
	struct gfs2_sbd *sdp = gl->gl_sbd;

	call_rcu(&gl->gl_rcu, gfs2_glock_dealloc);
	if (atomic_dec_and_test(&sdp->sd_glock_disposal))
		wake_up(&sdp->sd_glock_wait);
}

/**
 * gfs2_glock_hold() - increment reference count on glock
 * @gl: The glock to hold
 *
 */

void gfs2_glock_hold(struct gfs2_glock *gl)
{
	GLOCK_BUG_ON(gl, atomic_read(&gl->gl_ref) == 0);
	atomic_inc(&gl->gl_ref);
}

/**
 * demote_ok - Check to see if it's ok to unlock a glock
 * @gl: the glock
 *
 * Returns: 1 if it's ok
 */

static int demote_ok(const struct gfs2_glock *gl)
{
	const struct gfs2_glock_operations *glops = gl->gl_ops;

	if (gl->gl_state == LM_ST_UNLOCKED)
		return 0;
	if (!list_empty(&gl->gl_holders))
		return 0;
	if (glops->go_demote_ok)
		return glops->go_demote_ok(gl);
	return 1;
}

void gfs2_glock_add_to_lru(struct gfs2_glock *gl)
{
	spin_lock(&lru_lock);

	if (!list_empty(&gl->gl_lru))
		list_del_init(&gl->gl_lru);
	else
		atomic_inc(&lru_count);

	list_add_tail(&gl->gl_lru, &lru_list);
	set_bit(GLF_LRU, &gl->gl_flags);
	spin_unlock(&lru_lock);
}

static void __gfs2_glock_remove_from_lru(struct gfs2_glock *gl)
{
	if (!list_empty(&gl->gl_lru)) {
		list_del_init(&gl->gl_lru);
		atomic_dec(&lru_count);
		clear_bit(GLF_LRU, &gl->gl_flags);
	}
}

static void gfs2_glock_remove_from_lru(struct gfs2_glock *gl)
{
	spin_lock(&lru_lock);
	__gfs2_glock_remove_from_lru(gl);
	spin_unlock(&lru_lock);
}

/**
 * __gfs2_glock_schedule_for_reclaim - Add a glock to the reclaim list
 * @gl: the glock
 *
 * If the glock is demotable, then we add it (or move it) to the end
 * of the glock LRU list.
 */

static void __gfs2_glock_schedule_for_reclaim(struct gfs2_glock *gl)
{
	if (demote_ok(gl))
		gfs2_glock_add_to_lru(gl);
}

/**
 * gfs2_glock_put_nolock() - Decrement reference count on glock
 * @gl: The glock to put
 *
 * This function should only be used if the caller has its own reference
 * to the glock, in addition to the one it is dropping.
 */

void gfs2_glock_put_nolock(struct gfs2_glock *gl)
{
	if (atomic_dec_and_test(&gl->gl_ref))
		GLOCK_BUG_ON(gl, 1);
}

/**
 * gfs2_glock_put() - Decrement reference count on glock
 * @gl: The glock to put
 *
 */

void gfs2_glock_put(struct gfs2_glock *gl)
{
	struct gfs2_sbd *sdp = gl->gl_sbd;
	struct address_space *mapping = gfs2_glock2aspace(gl);

	if (atomic_dec_and_lock(&gl->gl_ref, &lru_lock)) {
		__gfs2_glock_remove_from_lru(gl);
		spin_unlock(&lru_lock);
		spin_lock_bucket(gl->gl_hash);
		hlist_bl_del_rcu(&gl->gl_list);
		spin_unlock_bucket(gl->gl_hash);
		GLOCK_BUG_ON(gl, !list_empty(&gl->gl_holders));
		GLOCK_BUG_ON(gl, mapping && mapping->nrpages);
		trace_gfs2_glock_put(gl);
		sdp->sd_lockstruct.ls_ops->lm_put_lock(gl);
	}
}
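
/*
 * Illustrative note (not part of the original file): every reference
 * taken with gfs2_glock_hold() (or via search_bucket(), which uses
 * atomic_inc_not_zero()) must be balanced by a gfs2_glock_put(); the
 * final put unhashes the glock and hands it back to the lock module:
 *
 *	gfs2_glock_hold(gl);
 *	... use gl ...
 *	gfs2_glock_put(gl);	// may be the final reference
 */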

/**
 * search_bucket() - Find struct gfs2_glock by lock number
 * @hash: the bucket to search
 * @sdp: the filesystem
 * @name: The lock name
 *
 * Returns: NULL, or the struct gfs2_glock with the requested number
 */

static struct gfs2_glock *search_bucket(unsigned int hash,
					const struct gfs2_sbd *sdp,
					const struct lm_lockname *name)
{
	struct gfs2_glock *gl;
	struct hlist_bl_node *h;

	hlist_bl_for_each_entry_rcu(gl, h, &gl_hash_table[hash], gl_list) {
		if (!lm_name_equal(&gl->gl_name, name))
			continue;
		if (gl->gl_sbd != sdp)
			continue;
		if (atomic_inc_not_zero(&gl->gl_ref))
			return gl;
	}

	return NULL;
}

/**
 * may_grant - check if it's ok to grant a new lock
 * @gl: The glock
 * @gh: The lock request which we wish to grant
 *
 * Returns: true if it's ok to grant the lock
 */

static inline int may_grant(const struct gfs2_glock *gl, const struct gfs2_holder *gh)
{
	const struct gfs2_holder *gh_head = list_entry(gl->gl_holders.next, const struct gfs2_holder, gh_list);
	if ((gh->gh_state == LM_ST_EXCLUSIVE ||
	     gh_head->gh_state == LM_ST_EXCLUSIVE) && gh != gh_head)
		return 0;
	if (gl->gl_state == gh->gh_state)
		return 1;
	if (gh->gh_flags & GL_EXACT)
		return 0;
	if (gl->gl_state == LM_ST_EXCLUSIVE) {
		if (gh->gh_state == LM_ST_SHARED && gh_head->gh_state == LM_ST_SHARED)
			return 1;
		if (gh->gh_state == LM_ST_DEFERRED && gh_head->gh_state == LM_ST_DEFERRED)
			return 1;
	}
	if (gl->gl_state != LM_ST_UNLOCKED && (gh->gh_flags & LM_FLAG_ANY))
		return 1;
	return 0;
}
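
/*
 * Illustrative note (not part of the original file): some outcomes of
 * the rules in may_grant() for a request that is not at the head of
 * the holders queue (and with a non-EX holder at the head):
 *
 *	glock state	request			granted?
 *	SH		SH			yes (states match)
 *	EX		SH			no  (an EX holder blocks everyone else)
 *	SH		EX			no  (EX is only granted at the head)
 *	SH		DF + LM_FLAG_ANY	yes (any locked state will do)
 */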

static void gfs2_holder_wake(struct gfs2_holder *gh)
{
	clear_bit(HIF_WAIT, &gh->gh_iflags);
	smp_mb__after_clear_bit();
	wake_up_bit(&gh->gh_iflags, HIF_WAIT);
}

/**
 * do_error - Something unexpected has happened during a lock request
 *
 */

static inline void do_error(struct gfs2_glock *gl, const int ret)
{
	struct gfs2_holder *gh, *tmp;

	list_for_each_entry_safe(gh, tmp, &gl->gl_holders, gh_list) {
		if (test_bit(HIF_HOLDER, &gh->gh_iflags))
			continue;
		if (ret & LM_OUT_ERROR)
			gh->gh_error = -EIO;
		else if (gh->gh_flags & (LM_FLAG_TRY | LM_FLAG_TRY_1CB))
			gh->gh_error = GLR_TRYFAILED;
		else
			continue;
		list_del_init(&gh->gh_list);
		trace_gfs2_glock_queue(gh, 0);
		gfs2_holder_wake(gh);
	}
}

/**
 * do_promote - promote as many requests as possible on the current queue
 * @gl: The glock
 *
 * Returns: 1 if there is a blocked holder at the head of the list, or 2
 *          if a type specific operation is underway.
 */

static int do_promote(struct gfs2_glock *gl)
__releases(&gl->gl_spin)
__acquires(&gl->gl_spin)
{
	const struct gfs2_glock_operations *glops = gl->gl_ops;
	struct gfs2_holder *gh, *tmp;
	int ret;

restart:
	list_for_each_entry_safe(gh, tmp, &gl->gl_holders, gh_list) {
		if (test_bit(HIF_HOLDER, &gh->gh_iflags))
			continue;
		if (may_grant(gl, gh)) {
			if (gh->gh_list.prev == &gl->gl_holders &&
			    glops->go_lock) {
				spin_unlock(&gl->gl_spin);
				/* FIXME: eliminate this eventually */
				ret = glops->go_lock(gh);
				spin_lock(&gl->gl_spin);
				if (ret) {
					if (ret == 1)
						return 2;
					gh->gh_error = ret;
					list_del_init(&gh->gh_list);
					trace_gfs2_glock_queue(gh, 0);
					gfs2_holder_wake(gh);
					goto restart;
				}
				set_bit(HIF_HOLDER, &gh->gh_iflags);
				trace_gfs2_promote(gh, 1);
				gfs2_holder_wake(gh);
				goto restart;
			}
			set_bit(HIF_HOLDER, &gh->gh_iflags);
			trace_gfs2_promote(gh, 0);
			gfs2_holder_wake(gh);
			continue;
		}
		if (gh->gh_list.prev == &gl->gl_holders)
			return 1;
		do_error(gl, 0);
		break;
	}
	return 0;
}

/**
 * find_first_waiter - find the first gh that's waiting for the glock
 * @gl: the glock
 */

static inline struct gfs2_holder *find_first_waiter(const struct gfs2_glock *gl)
{
	struct gfs2_holder *gh;

	list_for_each_entry(gh, &gl->gl_holders, gh_list) {
		if (!test_bit(HIF_HOLDER, &gh->gh_iflags))
			return gh;
	}
	return NULL;
}

/**
 * state_change - record that the glock is now in a different state
 * @gl: the glock
 * @new_state: the new state
 *
 */

static void state_change(struct gfs2_glock *gl, unsigned int new_state)
{
	int held1, held2;

	held1 = (gl->gl_state != LM_ST_UNLOCKED);
	held2 = (new_state != LM_ST_UNLOCKED);

	if (held1 != held2) {
		if (held2)
			gfs2_glock_hold(gl);
		else
			gfs2_glock_put_nolock(gl);
	}
	if (held1 && held2 && list_empty(&gl->gl_holders))
		clear_bit(GLF_QUEUED, &gl->gl_flags);

	if (new_state != gl->gl_target)
		/* shorten our minimum hold time */
		gl->gl_hold_time = max(gl->gl_hold_time - GL_GLOCK_HOLD_DECR,
				       GL_GLOCK_MIN_HOLD);
	gl->gl_state = new_state;
	gl->gl_tchange = jiffies;
}

static void gfs2_demote_wake(struct gfs2_glock *gl)
{
	gl->gl_demote_state = LM_ST_EXCLUSIVE;
	clear_bit(GLF_DEMOTE, &gl->gl_flags);
	smp_mb__after_clear_bit();
	wake_up_bit(&gl->gl_flags, GLF_DEMOTE);
}

/**
 * finish_xmote - The DLM has replied to one of our lock requests
 * @gl: The glock
 * @ret: The status from the DLM
 *
 */

static void finish_xmote(struct gfs2_glock *gl, unsigned int ret)
{
	const struct gfs2_glock_operations *glops = gl->gl_ops;
	struct gfs2_holder *gh;
	unsigned state = ret & LM_OUT_ST_MASK;
	int rv;

	spin_lock(&gl->gl_spin);
	trace_gfs2_glock_state_change(gl, state);
	state_change(gl, state);
	gh = find_first_waiter(gl);

	/* Demote to UN request arrived during demote to SH or DF */
	if (test_bit(GLF_DEMOTE_IN_PROGRESS, &gl->gl_flags) &&
	    state != LM_ST_UNLOCKED && gl->gl_demote_state == LM_ST_UNLOCKED)
		gl->gl_target = LM_ST_UNLOCKED;

	/* Check for state != intended state */
	if (unlikely(state != gl->gl_target)) {
		if (gh && !test_bit(GLF_DEMOTE_IN_PROGRESS, &gl->gl_flags)) {
			/* move to back of queue and try next entry */
			if (ret & LM_OUT_CANCELED) {
				if ((gh->gh_flags & LM_FLAG_PRIORITY) == 0)
					list_move_tail(&gh->gh_list, &gl->gl_holders);
				gh = find_first_waiter(gl);
				gl->gl_target = gh->gh_state;
				goto retry;
			}
			/* Some error or failed "try lock" - report it */
			if ((ret & LM_OUT_ERROR) ||
			    (gh->gh_flags & (LM_FLAG_TRY | LM_FLAG_TRY_1CB))) {
				gl->gl_target = gl->gl_state;
				do_error(gl, ret);
				goto out;
			}
		}
		switch(state) {
		/* Unlocked due to conversion deadlock, try again */
		case LM_ST_UNLOCKED:
retry:
			do_xmote(gl, gh, gl->gl_target);
			break;
		/* Conversion fails, unlock and try again */
		case LM_ST_SHARED:
		case LM_ST_DEFERRED:
			do_xmote(gl, gh, LM_ST_UNLOCKED);
			break;
		default: /* Everything else */
			printk(KERN_ERR "GFS2: wanted %u got %u\n", gl->gl_target, state);
			GLOCK_BUG_ON(gl, 1);
		}
		spin_unlock(&gl->gl_spin);
		return;
	}

	/* Fast path - we got what we asked for */
	if (test_and_clear_bit(GLF_DEMOTE_IN_PROGRESS, &gl->gl_flags))
		gfs2_demote_wake(gl);
	if (state != LM_ST_UNLOCKED) {
		if (glops->go_xmote_bh) {
			spin_unlock(&gl->gl_spin);
			rv = glops->go_xmote_bh(gl, gh);
			spin_lock(&gl->gl_spin);
			if (rv) {
				do_error(gl, rv);
				goto out;
			}
		}
		rv = do_promote(gl);
		if (rv == 2)
			goto out_locked;
	}
out:
	clear_bit(GLF_LOCK, &gl->gl_flags);
out_locked:
	spin_unlock(&gl->gl_spin);
}

/**
 * do_xmote - Calls the DLM to change the state of a lock
 * @gl: The lock state
 * @gh: The holder (only for promotes)
 * @target: The target lock state
 *
 */

static void do_xmote(struct gfs2_glock *gl, struct gfs2_holder *gh, unsigned int target)
__releases(&gl->gl_spin)
__acquires(&gl->gl_spin)
{
	const struct gfs2_glock_operations *glops = gl->gl_ops;
	struct gfs2_sbd *sdp = gl->gl_sbd;
	unsigned int lck_flags = gh ? gh->gh_flags : 0;
	int ret;

	lck_flags &= (LM_FLAG_TRY | LM_FLAG_TRY_1CB | LM_FLAG_NOEXP |
		      LM_FLAG_PRIORITY);
	GLOCK_BUG_ON(gl, gl->gl_state == target);
	GLOCK_BUG_ON(gl, gl->gl_state == gl->gl_target);
	if ((target == LM_ST_UNLOCKED || target == LM_ST_DEFERRED) &&
	    glops->go_inval) {
		set_bit(GLF_INVALIDATE_IN_PROGRESS, &gl->gl_flags);
		do_error(gl, 0); /* Fail queued try locks */
	}
	gl->gl_req = target;
	set_bit(GLF_BLOCKING, &gl->gl_flags);
	if ((gl->gl_req == LM_ST_UNLOCKED) ||
	    (gl->gl_state == LM_ST_EXCLUSIVE) ||
	    (lck_flags & (LM_FLAG_TRY|LM_FLAG_TRY_1CB)))
		clear_bit(GLF_BLOCKING, &gl->gl_flags);
	spin_unlock(&gl->gl_spin);
	if (glops->go_xmote_th)
		glops->go_xmote_th(gl);
	if (test_bit(GLF_INVALIDATE_IN_PROGRESS, &gl->gl_flags))
		glops->go_inval(gl, target == LM_ST_DEFERRED ? 0 : DIO_METADATA);
	clear_bit(GLF_INVALIDATE_IN_PROGRESS, &gl->gl_flags);

	gfs2_glock_hold(gl);
	if (sdp->sd_lockstruct.ls_ops->lm_lock) {
		/* lock_dlm */
		ret = sdp->sd_lockstruct.ls_ops->lm_lock(gl, target, lck_flags);
		GLOCK_BUG_ON(gl, ret);
	} else { /* lock_nolock */
		finish_xmote(gl, target);
		if (queue_delayed_work(glock_workqueue, &gl->gl_work, 0) == 0)
			gfs2_glock_put(gl);
	}

	spin_lock(&gl->gl_spin);
}

/**
 * find_first_holder - find the first "holder" gh
 * @gl: the glock
 */

static inline struct gfs2_holder *find_first_holder(const struct gfs2_glock *gl)
{
	struct gfs2_holder *gh;

	if (!list_empty(&gl->gl_holders)) {
		gh = list_entry(gl->gl_holders.next, struct gfs2_holder, gh_list);
		if (test_bit(HIF_HOLDER, &gh->gh_iflags))
			return gh;
	}
	return NULL;
}

/**
 * run_queue - do all outstanding tasks related to a glock
 * @gl: The glock in question
 * @nonblock: True if we must not block in run_queue
 *
 */

static void run_queue(struct gfs2_glock *gl, const int nonblock)
__releases(&gl->gl_spin)
__acquires(&gl->gl_spin)
{
	struct gfs2_holder *gh = NULL;
	int ret;

	if (test_and_set_bit(GLF_LOCK, &gl->gl_flags))
		return;

	GLOCK_BUG_ON(gl, test_bit(GLF_DEMOTE_IN_PROGRESS, &gl->gl_flags));

	if (test_bit(GLF_DEMOTE, &gl->gl_flags) &&
	    gl->gl_demote_state != gl->gl_state) {
		if (find_first_holder(gl))
			goto out_unlock;
		if (nonblock)
			goto out_sched;
		set_bit(GLF_DEMOTE_IN_PROGRESS, &gl->gl_flags);
		GLOCK_BUG_ON(gl, gl->gl_demote_state == LM_ST_EXCLUSIVE);
		gl->gl_target = gl->gl_demote_state;
	} else {
		if (test_bit(GLF_DEMOTE, &gl->gl_flags))
			gfs2_demote_wake(gl);
		ret = do_promote(gl);
		if (ret == 0)
			goto out_unlock;
		if (ret == 2)
			goto out;
		gh = find_first_waiter(gl);
		gl->gl_target = gh->gh_state;
		if (!(gh->gh_flags & (LM_FLAG_TRY | LM_FLAG_TRY_1CB)))
			do_error(gl, 0); /* Fail queued try locks */
	}
	do_xmote(gl, gh, gl->gl_target);
out:
	return;

out_sched:
	clear_bit(GLF_LOCK, &gl->gl_flags);
	smp_mb__after_clear_bit();
	gfs2_glock_hold(gl);
	if (queue_delayed_work(glock_workqueue, &gl->gl_work, 0) == 0)
		gfs2_glock_put_nolock(gl);
	return;

out_unlock:
	clear_bit(GLF_LOCK, &gl->gl_flags);
	smp_mb__after_clear_bit();
	return;
}

static void delete_work_func(struct work_struct *work)
{
	struct gfs2_glock *gl = container_of(work, struct gfs2_glock, gl_delete);
	struct gfs2_sbd *sdp = gl->gl_sbd;
	struct gfs2_inode *ip;
	struct inode *inode;
	u64 no_addr = gl->gl_name.ln_number;

	ip = gl->gl_object;
	/* Note: Unsafe to dereference ip as we don't hold right refs/locks */

	if (ip)
		inode = gfs2_ilookup(sdp->sd_vfs, no_addr, 1);
	else
		inode = gfs2_lookup_by_inum(sdp, no_addr, NULL, GFS2_BLKST_UNLINKED);
	if (inode && !IS_ERR(inode)) {
		d_prune_aliases(inode);
		iput(inode);
	}
	gfs2_glock_put(gl);
}

static void glock_work_func(struct work_struct *work)
{
	unsigned long delay = 0;
	struct gfs2_glock *gl = container_of(work, struct gfs2_glock, gl_work.work);
	int drop_ref = 0;

	if (test_and_clear_bit(GLF_REPLY_PENDING, &gl->gl_flags)) {
		finish_xmote(gl, gl->gl_reply);
		drop_ref = 1;
	}
	spin_lock(&gl->gl_spin);
	if (test_bit(GLF_PENDING_DEMOTE, &gl->gl_flags) &&
	    gl->gl_state != LM_ST_UNLOCKED &&
	    gl->gl_demote_state != LM_ST_EXCLUSIVE) {
		unsigned long holdtime, now = jiffies;

		holdtime = gl->gl_tchange + gl->gl_hold_time;
		if (time_before(now, holdtime))
			delay = holdtime - now;

		if (!delay) {
			clear_bit(GLF_PENDING_DEMOTE, &gl->gl_flags);
			set_bit(GLF_DEMOTE, &gl->gl_flags);
		}
	}
	run_queue(gl, 0);
	spin_unlock(&gl->gl_spin);
	if (!delay)
		gfs2_glock_put(gl);
	else {
		if (gl->gl_name.ln_type != LM_TYPE_INODE)
			delay = 0;
		if (queue_delayed_work(glock_workqueue, &gl->gl_work, delay) == 0)
			gfs2_glock_put(gl);
	}
	if (drop_ref)
		gfs2_glock_put(gl);
}

/**
 * gfs2_glock_get() - Get a glock, or create one if one doesn't exist
 * @sdp: The GFS2 superblock
 * @number: the lock number
 * @glops: The glock_operations to use
 * @create: If 0, don't create the glock if it doesn't exist
 * @glp: the glock is returned here
 *
 * This does not lock a glock, just finds/creates structures for one.
 *
 * Returns: errno
 */

int gfs2_glock_get(struct gfs2_sbd *sdp, u64 number,
		   const struct gfs2_glock_operations *glops, int create,
		   struct gfs2_glock **glp)
{
	struct super_block *s = sdp->sd_vfs;
	struct lm_lockname name = { .ln_number = number, .ln_type = glops->go_type };
	struct gfs2_glock *gl, *tmp;
	unsigned int hash = gl_hash(sdp, &name);
	struct address_space *mapping;
	struct kmem_cache *cachep;

	rcu_read_lock();
	gl = search_bucket(hash, sdp, &name);
	rcu_read_unlock();

	*glp = gl;
	if (gl)
		return 0;
	if (!create)
		return -ENOENT;

	if (glops->go_flags & GLOF_ASPACE)
		cachep = gfs2_glock_aspace_cachep;
	else
		cachep = gfs2_glock_cachep;
	gl = kmem_cache_alloc(cachep, GFP_KERNEL);
	if (!gl)
		return -ENOMEM;

	atomic_inc(&sdp->sd_glock_disposal);
	gl->gl_sbd = sdp;
	gl->gl_flags = 0;
	gl->gl_name = name;
	atomic_set(&gl->gl_ref, 1);
	gl->gl_state = LM_ST_UNLOCKED;
	gl->gl_target = LM_ST_UNLOCKED;
	gl->gl_demote_state = LM_ST_EXCLUSIVE;
	gl->gl_hash = hash;
	gl->gl_ops = glops;
	gl->gl_dstamp = ktime_set(0, 0);
	preempt_disable();
	/* We use the global stats to estimate the initial per-glock stats */
	gl->gl_stats = this_cpu_ptr(sdp->sd_lkstats)->lkstats[glops->go_type];
	preempt_enable();
	gl->gl_stats.stats[GFS2_LKS_DCOUNT] = 0;
	gl->gl_stats.stats[GFS2_LKS_QCOUNT] = 0;
	memset(&gl->gl_lksb, 0, sizeof(struct dlm_lksb));
	memset(gl->gl_lvb, 0, 32 * sizeof(char));
	gl->gl_lksb.sb_lvbptr = gl->gl_lvb;
	gl->gl_tchange = jiffies;
	gl->gl_object = NULL;
	gl->gl_hold_time = GL_GLOCK_DFT_HOLD;
	INIT_DELAYED_WORK(&gl->gl_work, glock_work_func);
	INIT_WORK(&gl->gl_delete, delete_work_func);

	mapping = gfs2_glock2aspace(gl);
	if (mapping) {
		mapping->a_ops = &gfs2_meta_aops;
		mapping->host = s->s_bdev->bd_inode;
		mapping->flags = 0;
		mapping_set_gfp_mask(mapping, GFP_NOFS);
		mapping->assoc_mapping = NULL;
		mapping->backing_dev_info = s->s_bdi;
		mapping->writeback_index = 0;
	}

	spin_lock_bucket(hash);
	tmp = search_bucket(hash, sdp, &name);
	if (tmp) {
		spin_unlock_bucket(hash);
		kmem_cache_free(cachep, gl);
		atomic_dec(&sdp->sd_glock_disposal);
		gl = tmp;
	} else {
		hlist_bl_add_head_rcu(&gl->gl_list, &gl_hash_table[hash]);
		spin_unlock_bucket(hash);
	}

	*glp = gl;

	return 0;
}
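
/*
 * Illustrative usage sketch (not part of the original file): callers
 * such as the inode code look up or create a glock for an on-disk
 * object and drop the extra reference when done. The glops pointer
 * here (&gfs2_inode_glops) is one of the operation tables defined in
 * glops.c:
 *
 *	struct gfs2_glock *gl;
 *	int error;
 *
 *	error = gfs2_glock_get(sdp, ip->i_no_addr, &gfs2_inode_glops,
 *			       CREATE, &gl);
 *	if (error)
 *		return error;
 *	... use gl, e.g. attach it to the inode ...
 *	gfs2_glock_put(gl);
 */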

/**
 * gfs2_holder_init - initialize a struct gfs2_holder in the default way
 * @gl: the glock
 * @state: the state we're requesting
 * @flags: the modifier flags
 * @gh: the holder structure
 *
 */

void gfs2_holder_init(struct gfs2_glock *gl, unsigned int state, unsigned flags,
		      struct gfs2_holder *gh)
{
	INIT_LIST_HEAD(&gh->gh_list);
	gh->gh_gl = gl;
	gh->gh_ip = (unsigned long)__builtin_return_address(0);
	gh->gh_owner_pid = get_pid(task_pid(current));
	gh->gh_state = state;
	gh->gh_flags = flags;
	gh->gh_error = 0;
	gh->gh_iflags = 0;
	gfs2_glock_hold(gl);
}

/**
 * gfs2_holder_reinit - reinitialize a struct gfs2_holder so we can requeue it
 * @state: the state we're requesting
 * @flags: the modifier flags
 * @gh: the holder structure
 *
 * Don't mess with the glock.
 *
 */

void gfs2_holder_reinit(unsigned int state, unsigned flags, struct gfs2_holder *gh)
{
	gh->gh_state = state;
	gh->gh_flags = flags;
	gh->gh_iflags = 0;
	gh->gh_ip = (unsigned long)__builtin_return_address(0);
	if (gh->gh_owner_pid)
		put_pid(gh->gh_owner_pid);
	gh->gh_owner_pid = get_pid(task_pid(current));
}

/**
 * gfs2_holder_uninit - uninitialize a holder structure (drop glock reference)
 * @gh: the holder structure
 *
 */

void gfs2_holder_uninit(struct gfs2_holder *gh)
{
	put_pid(gh->gh_owner_pid);
	gfs2_glock_put(gh->gh_gl);
	gh->gh_gl = NULL;
	gh->gh_ip = 0;
}

/**
 * gfs2_glock_holder_wait
 * @word: unused
 *
 * This function and gfs2_glock_demote_wait both show up in the WCHAN
 * field. Thus I've separated these otherwise identical functions in
 * order to be more informative to the user.
 */

static int gfs2_glock_holder_wait(void *word)
{
	schedule();
	return 0;
}

static int gfs2_glock_demote_wait(void *word)
{
	schedule();
	return 0;
}

static void wait_on_holder(struct gfs2_holder *gh)
{
	unsigned long time1 = jiffies;

	might_sleep();
	wait_on_bit(&gh->gh_iflags, HIF_WAIT, gfs2_glock_holder_wait, TASK_UNINTERRUPTIBLE);
	if (time_after(jiffies, time1 + HZ)) /* have we waited > a second? */
		/* Lengthen the minimum hold time. */
		gh->gh_gl->gl_hold_time = min(gh->gh_gl->gl_hold_time +
					      GL_GLOCK_HOLD_INCR,
					      GL_GLOCK_MAX_HOLD);
}
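
/*
 * Illustrative note (not part of the original file): the minimum hold
 * time adapts to contention. Assuming the GL_GLOCK_* constants from
 * glock.h, a holder that had to wait more than a second grows
 * gl_hold_time by GL_GLOCK_HOLD_INCR (capped at GL_GLOCK_MAX_HOLD),
 * while state_change() above shrinks it by GL_GLOCK_HOLD_DECR (floored
 * at GL_GLOCK_MIN_HOLD) whenever the glock ends up in a state other
 * than the one it was heading for.
 */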

static void wait_on_demote(struct gfs2_glock *gl)
{
	might_sleep();
	wait_on_bit(&gl->gl_flags, GLF_DEMOTE, gfs2_glock_demote_wait, TASK_UNINTERRUPTIBLE);
}

/**
 * handle_callback - process a demote request
 * @gl: the glock
 * @state: the state the caller wants us to change to
 *
 * There are only two requests that we are going to see in actual
 * practice: LM_ST_SHARED and LM_ST_UNLOCKED
 */

static void handle_callback(struct gfs2_glock *gl, unsigned int state,
			    unsigned long delay)
{
	int bit = delay ? GLF_PENDING_DEMOTE : GLF_DEMOTE;

	set_bit(bit, &gl->gl_flags);
	if (gl->gl_demote_state == LM_ST_EXCLUSIVE) {
		gl->gl_demote_state = state;
		gl->gl_demote_time = jiffies;
	} else if (gl->gl_demote_state != LM_ST_UNLOCKED &&
		   gl->gl_demote_state != state) {
		gl->gl_demote_state = LM_ST_UNLOCKED;
	}
	if (gl->gl_ops->go_callback)
		gl->gl_ops->go_callback(gl);
	trace_gfs2_demote_rq(gl);
}

/**
 * gfs2_glock_wait - wait on a glock acquisition
 * @gh: the glock holder
 *
 * Returns: 0 on success
 */

int gfs2_glock_wait(struct gfs2_holder *gh)
{
	wait_on_holder(gh);
	return gh->gh_error;
}

void gfs2_print_dbg(struct seq_file *seq, const char *fmt, ...)
{
	struct va_format vaf;
	va_list args;

	va_start(args, fmt);

	if (seq) {
		struct gfs2_glock_iter *gi = seq->private;
		vsprintf(gi->string, fmt, args);
		seq_puts(seq, gi->string);
	} else {
		vaf.fmt = fmt;
		vaf.va = &args;

		printk(KERN_ERR " %pV", &vaf);
	}

	va_end(args);
}

/**
 * add_to_queue - Add a holder to the wait queue (but look for recursion)
 * @gh: the holder structure to add
 *
 * Eventually we should move the recursive locking trap to a
 * debugging option or something like that. This is the fast
 * path and needs to have the minimum number of distractions.
 *
 */

static inline void add_to_queue(struct gfs2_holder *gh)
__releases(&gl->gl_spin)
__acquires(&gl->gl_spin)
{
	struct gfs2_glock *gl = gh->gh_gl;
	struct gfs2_sbd *sdp = gl->gl_sbd;
	struct list_head *insert_pt = NULL;
	struct gfs2_holder *gh2;
	int try_lock = 0;

	BUG_ON(gh->gh_owner_pid == NULL);
	if (test_and_set_bit(HIF_WAIT, &gh->gh_iflags))
		BUG();

	if (gh->gh_flags & (LM_FLAG_TRY | LM_FLAG_TRY_1CB)) {
		if (test_bit(GLF_LOCK, &gl->gl_flags))
			try_lock = 1;
		if (test_bit(GLF_INVALIDATE_IN_PROGRESS, &gl->gl_flags))
			goto fail;
	}

	list_for_each_entry(gh2, &gl->gl_holders, gh_list) {
		if (unlikely(gh2->gh_owner_pid == gh->gh_owner_pid &&
		    (gh->gh_gl->gl_ops->go_type != LM_TYPE_FLOCK)))
			goto trap_recursive;
		if (try_lock &&
		    !(gh2->gh_flags & (LM_FLAG_TRY | LM_FLAG_TRY_1CB)) &&
		    !may_grant(gl, gh)) {
fail:
			gh->gh_error = GLR_TRYFAILED;
			gfs2_holder_wake(gh);
			return;
		}
		if (test_bit(HIF_HOLDER, &gh2->gh_iflags))
			continue;
		if (unlikely((gh->gh_flags & LM_FLAG_PRIORITY) && !insert_pt))
			insert_pt = &gh2->gh_list;
	}
	set_bit(GLF_QUEUED, &gl->gl_flags);
	trace_gfs2_glock_queue(gh, 1);
	gfs2_glstats_inc(gl, GFS2_LKS_QCOUNT);
	gfs2_sbstats_inc(gl, GFS2_LKS_QCOUNT);
	if (likely(insert_pt == NULL)) {
		list_add_tail(&gh->gh_list, &gl->gl_holders);
		if (unlikely(gh->gh_flags & LM_FLAG_PRIORITY))
			goto do_cancel;
		return;
	}
	list_add_tail(&gh->gh_list, insert_pt);
do_cancel:
	gh = list_entry(gl->gl_holders.next, struct gfs2_holder, gh_list);
	if (!(gh->gh_flags & LM_FLAG_PRIORITY)) {
		spin_unlock(&gl->gl_spin);
		if (sdp->sd_lockstruct.ls_ops->lm_cancel)
			sdp->sd_lockstruct.ls_ops->lm_cancel(gl);
		spin_lock(&gl->gl_spin);
	}
	return;

trap_recursive:
	print_symbol(KERN_ERR "original: %s\n", gh2->gh_ip);
	printk(KERN_ERR "pid: %d\n", pid_nr(gh2->gh_owner_pid));
	printk(KERN_ERR "lock type: %d req lock state : %d\n",
	       gh2->gh_gl->gl_name.ln_type, gh2->gh_state);
	print_symbol(KERN_ERR "new: %s\n", gh->gh_ip);
	printk(KERN_ERR "pid: %d\n", pid_nr(gh->gh_owner_pid));
	printk(KERN_ERR "lock type: %d req lock state : %d\n",
	       gh->gh_gl->gl_name.ln_type, gh->gh_state);
	__dump_glock(NULL, gl);
	BUG();
}

/**
 * gfs2_glock_nq - enqueue a struct gfs2_holder onto a glock (acquire a glock)
 * @gh: the holder structure
 *
 * if (gh->gh_flags & GL_ASYNC), this never returns an error
 *
 * Returns: 0, GLR_TRYFAILED, or errno on failure
 */

int gfs2_glock_nq(struct gfs2_holder *gh)
{
	struct gfs2_glock *gl = gh->gh_gl;
	struct gfs2_sbd *sdp = gl->gl_sbd;
	int error = 0;

	if (unlikely(test_bit(SDF_SHUTDOWN, &sdp->sd_flags)))
		return -EIO;

	if (test_bit(GLF_LRU, &gl->gl_flags))
		gfs2_glock_remove_from_lru(gl);

	spin_lock(&gl->gl_spin);
	add_to_queue(gh);
	if ((LM_FLAG_NOEXP & gh->gh_flags) &&
	    test_and_clear_bit(GLF_FROZEN, &gl->gl_flags))
		set_bit(GLF_REPLY_PENDING, &gl->gl_flags);
	run_queue(gl, 1);
	spin_unlock(&gl->gl_spin);

	if (!(gh->gh_flags & GL_ASYNC))
		error = gfs2_glock_wait(gh);

	return error;
}
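
/*
 * Illustrative usage sketch (not part of the original file): the common
 * synchronous pattern initializes a holder, enqueues it, and releases
 * it again afterwards (the gfs2_glock_nq_init() wrapper in glock.h
 * combines the first two steps):
 *
 *	struct gfs2_holder gh;
 *	int error;
 *
 *	gfs2_holder_init(gl, LM_ST_SHARED, 0, &gh);
 *	error = gfs2_glock_nq(&gh);
 *	if (error)
 *		goto out_uninit;	// holder still owns a glock ref
 *	... access the object under the shared lock ...
 *	gfs2_glock_dq(&gh);
 * out_uninit:
 *	gfs2_holder_uninit(&gh);
 */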

/**
 * gfs2_glock_poll - poll to see if an async request has been completed
 * @gh: the holder
 *
 * Returns: 1 if the request is ready to be gfs2_glock_wait()ed on
 */

int gfs2_glock_poll(struct gfs2_holder *gh)
{
	return test_bit(HIF_WAIT, &gh->gh_iflags) ? 0 : 1;
}
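
/*
 * Illustrative usage sketch (not part of the original file): with
 * GL_ASYNC the enqueue returns immediately and the caller polls, then
 * collects the result with gfs2_glock_wait():
 *
 *	gfs2_holder_init(gl, LM_ST_EXCLUSIVE, GL_ASYNC, &gh);
 *	gfs2_glock_nq(&gh);		// never returns an error for GL_ASYNC
 *	while (!gfs2_glock_poll(&gh))
 *		... do other work ...
 *	error = gfs2_glock_wait(&gh);	// 0, GLR_TRYFAILED or errno
 */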

/**
 * gfs2_glock_dq - dequeue a struct gfs2_holder from a glock (release a glock)
 * @gh: the glock holder
 *
 */

void gfs2_glock_dq(struct gfs2_holder *gh)
{
	struct gfs2_glock *gl = gh->gh_gl;
	const struct gfs2_glock_operations *glops = gl->gl_ops;
	unsigned delay = 0;
	int fast_path = 0;

	spin_lock(&gl->gl_spin);
	if (gh->gh_flags & GL_NOCACHE)
		handle_callback(gl, LM_ST_UNLOCKED, 0);

	list_del_init(&gh->gh_list);
	if (find_first_holder(gl) == NULL) {
		if (glops->go_unlock) {
			GLOCK_BUG_ON(gl, test_and_set_bit(GLF_LOCK, &gl->gl_flags));
			spin_unlock(&gl->gl_spin);
			glops->go_unlock(gh);
			spin_lock(&gl->gl_spin);
			clear_bit(GLF_LOCK, &gl->gl_flags);
		}
		if (list_empty(&gl->gl_holders) &&
		    !test_bit(GLF_PENDING_DEMOTE, &gl->gl_flags) &&
		    !test_bit(GLF_DEMOTE, &gl->gl_flags))
			fast_path = 1;
	}
	if (!test_bit(GLF_LFLUSH, &gl->gl_flags))
		__gfs2_glock_schedule_for_reclaim(gl);
	trace_gfs2_glock_queue(gh, 0);
	spin_unlock(&gl->gl_spin);
	if (likely(fast_path))
		return;

	gfs2_glock_hold(gl);
	if (test_bit(GLF_PENDING_DEMOTE, &gl->gl_flags) &&
	    !test_bit(GLF_DEMOTE, &gl->gl_flags) &&
	    gl->gl_name.ln_type == LM_TYPE_INODE)
		delay = gl->gl_hold_time;
	if (queue_delayed_work(glock_workqueue, &gl->gl_work, delay) == 0)
		gfs2_glock_put(gl);
}

void gfs2_glock_dq_wait(struct gfs2_holder *gh)
{
	struct gfs2_glock *gl = gh->gh_gl;
	gfs2_glock_dq(gh);
	wait_on_demote(gl);
}

/**
 * gfs2_glock_dq_uninit - dequeue a holder from a glock and uninitialize it
 * @gh: the holder structure
 *
 */

void gfs2_glock_dq_uninit(struct gfs2_holder *gh)
{
	gfs2_glock_dq(gh);
	gfs2_holder_uninit(gh);
}

/**
 * gfs2_glock_nq_num - acquire a glock based on lock number
 * @sdp: the filesystem
 * @number: the lock number
 * @glops: the glock operations for the type of glock
 * @state: the state to acquire the glock in
 * @flags: modifier flags for the acquisition
 * @gh: the struct gfs2_holder
 *
 * Returns: errno
 */

int gfs2_glock_nq_num(struct gfs2_sbd *sdp, u64 number,
		      const struct gfs2_glock_operations *glops,
		      unsigned int state, int flags, struct gfs2_holder *gh)
{
	struct gfs2_glock *gl;
	int error;

	error = gfs2_glock_get(sdp, number, glops, CREATE, &gl);
	if (!error) {
		error = gfs2_glock_nq_init(gl, state, flags, gh);
		gfs2_glock_put(gl);
	}

	return error;
}

/**
 * glock_compare - Compare two struct gfs2_glock structures for sorting
 * @arg_a: the first structure
 * @arg_b: the second structure
 *
 */

static int glock_compare(const void *arg_a, const void *arg_b)
{
	const struct gfs2_holder *gh_a = *(const struct gfs2_holder **)arg_a;
	const struct gfs2_holder *gh_b = *(const struct gfs2_holder **)arg_b;
	const struct lm_lockname *a = &gh_a->gh_gl->gl_name;
	const struct lm_lockname *b = &gh_b->gh_gl->gl_name;

	if (a->ln_number > b->ln_number)
		return 1;
	if (a->ln_number < b->ln_number)
		return -1;
	BUG_ON(gh_a->gh_gl->gl_ops->go_type == gh_b->gh_gl->gl_ops->go_type);
	return 0;
}

/**
 * nq_m_sync - synchronously acquire more than one glock in deadlock free order
 * @num_gh: the number of structures
 * @ghs: an array of struct gfs2_holder structures
 *
 * Returns: 0 on success (all glocks acquired),
 *          errno on failure (no glocks acquired)
 */

static int nq_m_sync(unsigned int num_gh, struct gfs2_holder *ghs,
		     struct gfs2_holder **p)
{
	unsigned int x;
	int error = 0;

	for (x = 0; x < num_gh; x++)
		p[x] = &ghs[x];

	sort(p, num_gh, sizeof(struct gfs2_holder *), glock_compare, NULL);

	for (x = 0; x < num_gh; x++) {
		p[x]->gh_flags &= ~(LM_FLAG_TRY | GL_ASYNC);

		error = gfs2_glock_nq(p[x]);
		if (error) {
			while (x--)
				gfs2_glock_dq(p[x]);
			break;
		}
	}

	return error;
}

/**
 * gfs2_glock_nq_m - acquire multiple glocks
 * @num_gh: the number of structures
 * @ghs: an array of struct gfs2_holder structures
 *
 * Returns: 0 on success (all glocks acquired),
 *          errno on failure (no glocks acquired)
 */

int gfs2_glock_nq_m(unsigned int num_gh, struct gfs2_holder *ghs)
{
	struct gfs2_holder *tmp[4];
	struct gfs2_holder **pph = tmp;
	int error = 0;

	switch(num_gh) {
	case 0:
		return 0;
	case 1:
		ghs->gh_flags &= ~(LM_FLAG_TRY | GL_ASYNC);
		return gfs2_glock_nq(ghs);
	default:
		if (num_gh <= 4)
			break;
		pph = kmalloc(num_gh * sizeof(struct gfs2_holder *), GFP_NOFS);
		if (!pph)
			return -ENOMEM;
	}

	error = nq_m_sync(num_gh, ghs, pph);

	if (pph != tmp)
		kfree(pph);

	return error;
}
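
/*
 * Illustrative usage sketch (not part of the original file): acquiring
 * several glocks in one call; the helper sorts the holders by lock
 * number (see glock_compare()) so that all callers take them in the
 * same order, which avoids ABBA deadlocks:
 *
 *	struct gfs2_holder ghs[2];
 *
 *	gfs2_holder_init(gl_a, LM_ST_EXCLUSIVE, 0, &ghs[0]);
 *	gfs2_holder_init(gl_b, LM_ST_EXCLUSIVE, 0, &ghs[1]);
 *	error = gfs2_glock_nq_m(2, ghs);	// all or nothing
 *	if (!error)
 *		gfs2_glock_dq_m(2, ghs);
 *	gfs2_holder_uninit(&ghs[0]);
 *	gfs2_holder_uninit(&ghs[1]);
 */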

/**
 * gfs2_glock_dq_m - release multiple glocks
 * @num_gh: the number of structures
 * @ghs: an array of struct gfs2_holder structures
 *
 */

void gfs2_glock_dq_m(unsigned int num_gh, struct gfs2_holder *ghs)
{
	while (num_gh--)
		gfs2_glock_dq(&ghs[num_gh]);
}

/**
 * gfs2_glock_dq_uninit_m - release multiple glocks
 * @num_gh: the number of structures
 * @ghs: an array of struct gfs2_holder structures
 *
 */

void gfs2_glock_dq_uninit_m(unsigned int num_gh, struct gfs2_holder *ghs)
{
	while (num_gh--)
		gfs2_glock_dq_uninit(&ghs[num_gh]);
}

void gfs2_glock_cb(struct gfs2_glock *gl, unsigned int state)
{
	unsigned long delay = 0;
	unsigned long holdtime;
	unsigned long now = jiffies;

	gfs2_glock_hold(gl);
	holdtime = gl->gl_tchange + gl->gl_hold_time;
	if (test_bit(GLF_QUEUED, &gl->gl_flags) &&
	    gl->gl_name.ln_type == LM_TYPE_INODE) {
		if (time_before(now, holdtime))
			delay = holdtime - now;
		if (test_bit(GLF_REPLY_PENDING, &gl->gl_flags))
			delay = gl->gl_hold_time;
	}

	spin_lock(&gl->gl_spin);
	handle_callback(gl, state, delay);
	spin_unlock(&gl->gl_spin);
	if (queue_delayed_work(glock_workqueue, &gl->gl_work, delay) == 0)
		gfs2_glock_put(gl);
}

/**
 * gfs2_should_freeze - Figure out if glock should be frozen
 * @gl: The glock in question
 *
 * Glocks are not frozen if (a) the result of the dlm operation is
 * an error, (b) the locking operation was an unlock operation or
 * (c) if there is a "noexp" flagged request anywhere in the queue
 *
 * Returns: 1 if freezing should occur, 0 otherwise
 */

static int gfs2_should_freeze(const struct gfs2_glock *gl)
{
	const struct gfs2_holder *gh;

	if (gl->gl_reply & ~LM_OUT_ST_MASK)
		return 0;
	if (gl->gl_target == LM_ST_UNLOCKED)
		return 0;

	list_for_each_entry(gh, &gl->gl_holders, gh_list) {
		if (test_bit(HIF_HOLDER, &gh->gh_iflags))
			continue;
		if (LM_FLAG_NOEXP & gh->gh_flags)
			return 0;
	}

	return 1;
}

/**
 * gfs2_glock_complete - Callback used by locking
 * @gl: Pointer to the glock
 * @ret: The return value from the dlm
 *
 * The gl_reply field is under the gl_spin lock so that it is ok
 * to use a bitfield shared with other glock state fields.
 */

void gfs2_glock_complete(struct gfs2_glock *gl, int ret)
{
	struct lm_lockstruct *ls = &gl->gl_sbd->sd_lockstruct;

	spin_lock(&gl->gl_spin);
	gl->gl_reply = ret;

	if (unlikely(test_bit(DFL_BLOCK_LOCKS, &ls->ls_recover_flags))) {
		if (gfs2_should_freeze(gl)) {
			set_bit(GLF_FROZEN, &gl->gl_flags);
			spin_unlock(&gl->gl_spin);
			return;
		}
	}

	spin_unlock(&gl->gl_spin);
	set_bit(GLF_REPLY_PENDING, &gl->gl_flags);
	smp_wmb();
	gfs2_glock_hold(gl);
	if (queue_delayed_work(glock_workqueue, &gl->gl_work, 0) == 0)
		gfs2_glock_put(gl);
}

static int gfs2_shrink_glock_memory(struct shrinker *shrink,
				    struct shrink_control *sc)
{
	struct gfs2_glock *gl;
	int may_demote;
	int nr_skipped = 0;
	int nr = sc->nr_to_scan;
	gfp_t gfp_mask = sc->gfp_mask;
	LIST_HEAD(skipped);

	if (nr == 0)
		goto out;

	if (!(gfp_mask & __GFP_FS))
		return -1;

	spin_lock(&lru_lock);
	while(nr && !list_empty(&lru_list)) {
		gl = list_entry(lru_list.next, struct gfs2_glock, gl_lru);
		list_del_init(&gl->gl_lru);
		clear_bit(GLF_LRU, &gl->gl_flags);
		atomic_dec(&lru_count);

		/* Test for being demotable */
		if (!test_and_set_bit(GLF_LOCK, &gl->gl_flags)) {
			gfs2_glock_hold(gl);
			spin_unlock(&lru_lock);
			spin_lock(&gl->gl_spin);
			may_demote = demote_ok(gl);
			if (may_demote) {
				handle_callback(gl, LM_ST_UNLOCKED, 0);
				nr--;
			}
			clear_bit(GLF_LOCK, &gl->gl_flags);
			smp_mb__after_clear_bit();
			if (queue_delayed_work(glock_workqueue, &gl->gl_work, 0) == 0)
				gfs2_glock_put_nolock(gl);
			spin_unlock(&gl->gl_spin);
			spin_lock(&lru_lock);
			continue;
		}
		nr_skipped++;
		list_add(&gl->gl_lru, &skipped);
		set_bit(GLF_LRU, &gl->gl_flags);
	}
	list_splice(&skipped, &lru_list);
	atomic_add(nr_skipped, &lru_count);
	spin_unlock(&lru_lock);
out:
	return (atomic_read(&lru_count) / 100) * sysctl_vfs_cache_pressure;
}

static struct shrinker glock_shrinker = {
	.shrink = gfs2_shrink_glock_memory,
	.seeks = DEFAULT_SEEKS,
};
1452
b3b94faa
DT
1453/**
1454 * examine_bucket - Call a function for glock in a hash bucket
1455 * @examiner: the function
1456 * @sdp: the filesystem
1457 * @bucket: the bucket
1458 *
b3b94faa
DT
1459 */
1460
bc015cb8 1461static void examine_bucket(glock_examiner examiner, const struct gfs2_sbd *sdp,
37b2fa6a 1462 unsigned int hash)
b3b94faa 1463{
bc015cb8
SW
1464 struct gfs2_glock *gl;
1465 struct hlist_bl_head *head = &gl_hash_table[hash];
1466 struct hlist_bl_node *pos;
b3b94faa 1467
bc015cb8
SW
1468 rcu_read_lock();
1469 hlist_bl_for_each_entry_rcu(gl, pos, head, gl_list) {
1470 if ((gl->gl_sbd == sdp) && atomic_read(&gl->gl_ref))
24264434 1471 examiner(gl);
b3b94faa 1472 }
bc015cb8 1473 rcu_read_unlock();
8fbbfd21 1474 cond_resched();
bc015cb8
SW
1475}
1476
1477static void glock_hash_walk(glock_examiner examiner, const struct gfs2_sbd *sdp)
1478{
1479 unsigned x;
1480
1481 for (x = 0; x < GFS2_GL_HASH_SIZE; x++)
1482 examine_bucket(examiner, sdp, x);
b3b94faa
DT
1483}
1484
f057f6cd
SW
1485
1486/**
1487 * thaw_glock - thaw out a glock which has an unprocessed reply waiting
1488 * @gl: The glock to thaw
1489 *
1490 * N.B. When we freeze a glock, we leave a ref to the glock outstanding,
1491 * so this has to result in the ref count being dropped by one.
1492 */
1493
1494static void thaw_glock(struct gfs2_glock *gl)
1495{
1496 if (!test_and_clear_bit(GLF_FROZEN, &gl->gl_flags))
1497 return;
f057f6cd
SW
1498 set_bit(GLF_REPLY_PENDING, &gl->gl_flags);
1499 gfs2_glock_hold(gl);
1500 if (queue_delayed_work(glock_workqueue, &gl->gl_work, 0) == 0)
1501 gfs2_glock_put(gl);
f057f6cd
SW
1502}
1503
b3b94faa
DT
1504/**
1505 * clear_glock - look at a glock and see if we can free it from glock cache
1506 * @gl: the glock to look at
1507 *
1508 */
1509
1510static void clear_glock(struct gfs2_glock *gl)
1511{
f42ab085 1512 gfs2_glock_remove_from_lru(gl);
b3b94faa 1513
6802e340 1514 spin_lock(&gl->gl_spin);
c741c455 1515 if (gl->gl_state != LM_ST_UNLOCKED)
97cc1025 1516 handle_callback(gl, LM_ST_UNLOCKED, 0);
6802e340
SW
1517 spin_unlock(&gl->gl_spin);
1518 gfs2_glock_hold(gl);
1519 if (queue_delayed_work(glock_workqueue, &gl->gl_work, 0) == 0)
1520 gfs2_glock_put(gl);
b3b94faa
DT
1521}
1522
f057f6cd
SW
1523/**
1524 * gfs2_glock_thaw - Thaw any frozen glocks
1525 * @sdp: The super block
1526 *
1527 */
1528
1529void gfs2_glock_thaw(struct gfs2_sbd *sdp)
1530{
bc015cb8
SW
1531 glock_hash_walk(thaw_glock, sdp);
1532}
f057f6cd 1533
bc015cb8
SW
1534static int dump_glock(struct seq_file *seq, struct gfs2_glock *gl)
1535{
1536 int ret;
1537 spin_lock(&gl->gl_spin);
1538 ret = __dump_glock(seq, gl);
1539 spin_unlock(&gl->gl_spin);
1540 return ret;
1541}
1542
1543static void dump_glock_func(struct gfs2_glock *gl)
1544{
1545 dump_glock(NULL, gl);
f057f6cd
SW
1546}
1547
b3b94faa
DT
1548/**
1549 * gfs2_gl_hash_clear - Empty out the glock hash table
1550 * @sdp: the filesystem
1551 * @wait: wait until it's all gone
1552 *
1bdad606 1553 * Called when unmounting the filesystem.
b3b94faa
DT
1554 */
1555
fefc03bf 1556void gfs2_gl_hash_clear(struct gfs2_sbd *sdp)
b3b94faa 1557{
bc015cb8 1558 glock_hash_walk(clear_glock, sdp);
8f05228e
SW
1559 flush_workqueue(glock_workqueue);
1560 wait_event(sdp->sd_glock_wait, atomic_read(&sdp->sd_glock_disposal) == 0);
bc015cb8 1561 glock_hash_walk(dump_glock_func, sdp);
b3b94faa
DT
1562}
1563
813e0c46
SW
1564void gfs2_glock_finish_truncate(struct gfs2_inode *ip)
1565{
1566 struct gfs2_glock *gl = ip->i_gl;
1567 int ret;
1568
1569 ret = gfs2_truncatei_resume(ip);
1570 gfs2_assert_withdraw(gl->gl_sbd, ret == 0);
1571
1572 spin_lock(&gl->gl_spin);
1573 clear_bit(GLF_LOCK, &gl->gl_flags);
1574 run_queue(gl, 1);
1575 spin_unlock(&gl->gl_spin);
1576}
1577
6802e340 1578static const char *state2str(unsigned state)
04b933f2 1579{
6802e340
SW
1580 switch(state) {
1581 case LM_ST_UNLOCKED:
1582 return "UN";
1583 case LM_ST_SHARED:
1584 return "SH";
1585 case LM_ST_DEFERRED:
1586 return "DF";
1587 case LM_ST_EXCLUSIVE:
1588 return "EX";
1589 }
1590 return "??";
1591}
1592
1593static const char *hflags2str(char *buf, unsigned flags, unsigned long iflags)
1594{
1595 char *p = buf;
1596 if (flags & LM_FLAG_TRY)
1597 *p++ = 't';
1598 if (flags & LM_FLAG_TRY_1CB)
1599 *p++ = 'T';
1600 if (flags & LM_FLAG_NOEXP)
1601 *p++ = 'e';
1602 if (flags & LM_FLAG_ANY)
f057f6cd 1603 *p++ = 'A';
6802e340
SW
1604 if (flags & LM_FLAG_PRIORITY)
1605 *p++ = 'p';
1606 if (flags & GL_ASYNC)
1607 *p++ = 'a';
1608 if (flags & GL_EXACT)
1609 *p++ = 'E';
6802e340
SW
1610 if (flags & GL_NOCACHE)
1611 *p++ = 'c';
1612 if (test_bit(HIF_HOLDER, &iflags))
1613 *p++ = 'H';
1614 if (test_bit(HIF_WAIT, &iflags))
1615 *p++ = 'W';
1616 if (test_bit(HIF_FIRST, &iflags))
1617 *p++ = 'F';
1618 *p = 0;
1619 return buf;
04b933f2
RP
1620}
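
/*
 * Illustrative note (not part of the original file): the holder flags
 * string is read left to right, e.g. "tH" describes a "try" request
 * (LM_FLAG_TRY) whose holder has been granted (HIF_HOLDER), while "aW"
 * is an asynchronous request (GL_ASYNC) still waiting (HIF_WAIT).
 */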

/**
 * dump_holder - print information about a glock holder
 * @seq: the seq_file struct
 * @gh: the glock holder
 *
 * Returns: 0 on success, -ENOBUFS when we run out of space
 */

static int dump_holder(struct seq_file *seq, const struct gfs2_holder *gh)
{
	struct task_struct *gh_owner = NULL;
	char flags_buf[32];

	if (gh->gh_owner_pid)
		gh_owner = pid_task(gh->gh_owner_pid, PIDTYPE_PID);
	gfs2_print_dbg(seq, " H: s:%s f:%s e:%d p:%ld [%s] %pS\n",
		       state2str(gh->gh_state),
		       hflags2str(flags_buf, gh->gh_flags, gh->gh_iflags),
		       gh->gh_error,
		       gh->gh_owner_pid ? (long)pid_nr(gh->gh_owner_pid) : -1,
		       gh_owner ? gh_owner->comm : "(ended)",
		       (void *)gh->gh_ip);
	return 0;
}

static const char *gflags2str(char *buf, const struct gfs2_glock *gl)
{
	const unsigned long *gflags = &gl->gl_flags;
	char *p = buf;

	if (test_bit(GLF_LOCK, gflags))
		*p++ = 'l';
	if (test_bit(GLF_DEMOTE, gflags))
		*p++ = 'D';
	if (test_bit(GLF_PENDING_DEMOTE, gflags))
		*p++ = 'd';
	if (test_bit(GLF_DEMOTE_IN_PROGRESS, gflags))
		*p++ = 'p';
	if (test_bit(GLF_DIRTY, gflags))
		*p++ = 'y';
	if (test_bit(GLF_LFLUSH, gflags))
		*p++ = 'f';
	if (test_bit(GLF_INVALIDATE_IN_PROGRESS, gflags))
		*p++ = 'i';
	if (test_bit(GLF_REPLY_PENDING, gflags))
		*p++ = 'r';
	if (test_bit(GLF_INITIAL, gflags))
		*p++ = 'I';
	if (test_bit(GLF_FROZEN, gflags))
		*p++ = 'F';
	if (test_bit(GLF_QUEUED, gflags))
		*p++ = 'q';
	if (test_bit(GLF_LRU, gflags))
		*p++ = 'L';
	if (gl->gl_object)
		*p++ = 'o';
	if (test_bit(GLF_BLOCKING, gflags))
		*p++ = 'b';
	*p = 0;
	return buf;
}

/**
 * __dump_glock - print information about a glock
 * @seq: The seq_file struct
 * @gl: the glock
 *
 * The file format is as follows:
 * One line per object, capital letters are used to indicate objects
 * G = glock, I = Inode, R = rgrp, H = holder. Glocks are not indented,
 * other objects are indented by a single space and follow the glock to
 * which they are related. Fields are indicated by lower case letters
 * followed by a colon and the field value, except for strings which are in
 * [] so that it's possible to see if they are composed of spaces for
 * example. The fields are n = number (id of the object), f = flags,
 * t = type, s = state, r = refcount, e = error, p = pid.
 *
 * Returns: 0 on success, -ENOBUFS when we run out of space
 */

static int __dump_glock(struct seq_file *seq, const struct gfs2_glock *gl)
{
	const struct gfs2_glock_operations *glops = gl->gl_ops;
	unsigned long long dtime;
	const struct gfs2_holder *gh;
	char gflags_buf[32];
	int error = 0;

	dtime = jiffies - gl->gl_demote_time;
	dtime *= 1000000/HZ; /* demote time in uSec */
	if (!test_bit(GLF_DEMOTE, &gl->gl_flags))
		dtime = 0;
	gfs2_print_dbg(seq, "G:  s:%s n:%u/%llx f:%s t:%s d:%s/%llu a:%d v:%d r:%d m:%ld\n",
		       state2str(gl->gl_state),
		       gl->gl_name.ln_type,
		       (unsigned long long)gl->gl_name.ln_number,
		       gflags2str(gflags_buf, gl),
		       state2str(gl->gl_target),
		       state2str(gl->gl_demote_state), dtime,
		       atomic_read(&gl->gl_ail_count),
		       atomic_read(&gl->gl_revokes),
		       atomic_read(&gl->gl_ref), gl->gl_hold_time);

	list_for_each_entry(gh, &gl->gl_holders, gh_list) {
		error = dump_holder(seq, gh);
		if (error)
			goto out;
	}
	if (gl->gl_state != LM_ST_UNLOCKED && glops->go_dump)
		error = glops->go_dump(seq, gl);
out:
	return error;
}
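
/*
 * Illustrative note (not part of the original file): a glock line in
 * the debugfs dump produced above looks roughly like
 *
 *	G:  s:SH n:2/5f3a f:q t:SH d:EX/0 a:0 v:0 r:3 m:10
 *
 * i.e. a shared inode glock (type 2), with the flag letters coming from
 * gflags2str() and any " H:" holder lines following it.
 */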

static int gfs2_glstats_seq_show(struct seq_file *seq, void *iter_ptr)
{
	struct gfs2_glock *gl = iter_ptr;

	seq_printf(seq, "G: n:%u/%llx rtt:%lld/%lld rttb:%lld/%lld irt:%lld/%lld dcnt: %lld qcnt: %lld\n",
		   gl->gl_name.ln_type,
		   (unsigned long long)gl->gl_name.ln_number,
		   (long long)gl->gl_stats.stats[GFS2_LKS_SRTT],
		   (long long)gl->gl_stats.stats[GFS2_LKS_SRTTVAR],
		   (long long)gl->gl_stats.stats[GFS2_LKS_SRTTB],
		   (long long)gl->gl_stats.stats[GFS2_LKS_SRTTVARB],
		   (long long)gl->gl_stats.stats[GFS2_LKS_SIRT],
		   (long long)gl->gl_stats.stats[GFS2_LKS_SIRTVAR],
		   (long long)gl->gl_stats.stats[GFS2_LKS_DCOUNT],
		   (long long)gl->gl_stats.stats[GFS2_LKS_QCOUNT]);
	return 0;
}
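
/*
 * Illustrative note (not part of the original file): each glstats line
 * reports the per-glock lock statistics in the order srtt/srttvar,
 * srttb/srttvarb, sirt/sirtvar and the dlm/queue counts, e.g.
 *
 *	G: n:2/5f3a rtt:500/250 rttb:800/400 irt:1000/500 dcnt: 12 qcnt: 30
 */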
1753
1754static const char *gfs2_gltype[] = {
1755 "type",
1756 "reserved",
1757 "nondisk",
1758 "inode",
1759 "rgrp",
1760 "meta",
1761 "iopen",
1762 "flock",
1763 "plock",
1764 "quota",
1765 "journal",
1766};
1767
1768static const char *gfs2_stype[] = {
1769 [GFS2_LKS_SRTT] = "srtt",
1770 [GFS2_LKS_SRTTVAR] = "srttvar",
1771 [GFS2_LKS_SRTTB] = "srttb",
1772 [GFS2_LKS_SRTTVARB] = "srttvarb",
1773 [GFS2_LKS_SIRT] = "sirt",
1774 [GFS2_LKS_SIRTVAR] = "sirtvar",
1775 [GFS2_LKS_DCOUNT] = "dlm",
1776 [GFS2_LKS_QCOUNT] = "queue",
1777};
1778
1779#define GFS2_NR_SBSTATS (ARRAY_SIZE(gfs2_gltype) * ARRAY_SIZE(gfs2_stype))
1780
1781static int gfs2_sbstats_seq_show(struct seq_file *seq, void *iter_ptr)
1782{
1783 struct gfs2_glock_iter *gi = seq->private;
1784 struct gfs2_sbd *sdp = gi->sdp;
1785 unsigned index = gi->hash >> 3;
1786 unsigned subindex = gi->hash & 0x07;
1787 s64 value;
1788 int i;
1789
1790 if (index == 0 && subindex != 0)
1791 return 0;
6802e340 1792
a245769f
SW
1793 seq_printf(seq, "%-10s %8s:", gfs2_gltype[index],
1794 (index == 0) ? "cpu": gfs2_stype[subindex]);
b3b94faa 1795
a245769f
SW
1796 for_each_possible_cpu(i) {
1797 const struct gfs2_pcpu_lkstats *lkstats = per_cpu_ptr(sdp->sd_lkstats, i);
1798 if (index == 0) {
1799 value = i;
1800 } else {
1801 value = lkstats->lkstats[index - 1].stats[subindex];
1802 }
1803 seq_printf(seq, " %15lld", (long long)value);
1804 }
1805 seq_putc(seq, '\n');
1806 return 0;
1807}
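
The resulting sbstats file has one row per (glock type, statistic) pair and one
column per possible CPU; the first row pairs the heading "type" with "cpu" and
simply lists the CPU numbers. A made-up two-CPU fragment (column widths, which
come from the %-10s/%8s/%15lld specifiers above, are compressed here for
readability):

type cpu: 0 1
inode srtt: 1043 987
inode srttvar: 210 198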
8fbbfd21 1808
85d1da67
SW
1809int __init gfs2_glock_init(void)
1810{
1811 unsigned i;
1812 for(i = 0; i < GFS2_GL_HASH_SIZE; i++) {
bc015cb8 1813 INIT_HLIST_BL_HEAD(&gl_hash_table[i]);
087efdd3 1814 }
8fbbfd21 1815
d2115778 1816 glock_workqueue = alloc_workqueue("glock_workqueue", WQ_MEM_RECLAIM |
58a69cb4 1817 WQ_HIGHPRI | WQ_FREEZABLE, 0);
97cc1025 1818 if (!glock_workqueue) /* alloc_workqueue() returns NULL on failure, not an ERR_PTR */
c4f68a13 1819 return -ENOMEM;
d2115778 1820 gfs2_delete_workqueue = alloc_workqueue("delete_workqueue",
58a69cb4 1821 WQ_MEM_RECLAIM | WQ_FREEZABLE,
d2115778 1822 0);
b94a170e
BM
1823 if (!gfs2_delete_workqueue) {
1824 destroy_workqueue(glock_workqueue);
1825 return -ENOMEM;
1826 }
97cc1025
SW
1827
1828 register_shrinker(&glock_shrinker);
c4f68a13 1829
85d1da67
SW
1830 return 0;
1831}
1832
8fbbfd21
SW
1833void gfs2_glock_exit(void)
1834{
97cc1025 1835 unregister_shrinker(&glock_shrinker);
c4f68a13 1836 destroy_workqueue(glock_workqueue);
b94a170e 1837 destroy_workqueue(gfs2_delete_workqueue);
8fbbfd21
SW
1838}
1839
bc015cb8
SW
1840static inline struct gfs2_glock *glock_hash_chain(unsigned hash)
1841{
1842 return hlist_bl_entry(hlist_bl_first_rcu(&gl_hash_table[hash]),
1843 struct gfs2_glock, gl_list);
1844}
1845
1846static inline struct gfs2_glock *glock_hash_next(struct gfs2_glock *gl)
1847{
7e32d026 1848 return hlist_bl_entry(rcu_dereference(gl->gl_list.next),
bc015cb8
SW
1849 struct gfs2_glock, gl_list);
1850}
1851
6802e340 1852static int gfs2_glock_iter_next(struct gfs2_glock_iter *gi)
7c52b166 1853{
7b08fc62
SW
1854 struct gfs2_glock *gl;
1855
bc015cb8
SW
1856 do {
1857 gl = gi->gl;
1858 if (gl) {
1859 gi->gl = glock_hash_next(gl);
ba1ddcb6 1860 gi->nhash++;
bc015cb8 1861 } else {
ba1ddcb6
SW
1862 if (gi->hash >= GFS2_GL_HASH_SIZE) {
1863 rcu_read_unlock();
1864 return 1;
1865 }
bc015cb8 1866 gi->gl = glock_hash_chain(gi->hash);
ba1ddcb6 1867 gi->nhash = 0;
bc015cb8
SW
1868 }
1869 while (gi->gl == NULL) {
1870 gi->hash++;
1871 if (gi->hash >= GFS2_GL_HASH_SIZE) {
1872 rcu_read_unlock();
1873 return 1;
1874 }
1875 gi->gl = glock_hash_chain(gi->hash);
ba1ddcb6 1876 gi->nhash = 0;
bc015cb8
SW
1877 }
1878 /* Skip entries for other sb and dead entries */
1879 } while (gi->sdp != gi->gl->gl_sbd || atomic_read(&gi->gl->gl_ref) == 0);
a947e033 1880
7c52b166
RP
1881 return 0;
1882}
1883
6802e340 1884static void *gfs2_glock_seq_start(struct seq_file *seq, loff_t *pos)
7c52b166 1885{
6802e340 1886 struct gfs2_glock_iter *gi = seq->private;
7c52b166
RP
1887 loff_t n = *pos;
1888
ba1ddcb6
SW
1889 if (gi->last_pos <= *pos)
1890 n = gi->nhash + (*pos - gi->last_pos);
1891 else
1892 gi->hash = 0;
1893
1894 gi->nhash = 0;
bc015cb8 1895 rcu_read_lock();
7c52b166 1896
6802e340 1897 do {
bc015cb8 1898 if (gfs2_glock_iter_next(gi))
7c52b166 1899 return NULL;
6802e340 1900 } while (n--);
7c52b166 1901
ba1ddcb6 1902 gi->last_pos = *pos;
6802e340 1903 return gi->gl;
7c52b166
RP
1904}
1905
6802e340 1906static void *gfs2_glock_seq_next(struct seq_file *seq, void *iter_ptr,
7c52b166
RP
1907 loff_t *pos)
1908{
6802e340 1909 struct gfs2_glock_iter *gi = seq->private;
7c52b166
RP
1910
1911 (*pos)++;
ba1ddcb6 1912 gi->last_pos = *pos;
bc015cb8 1913 if (gfs2_glock_iter_next(gi))
7c52b166 1914 return NULL;
7c52b166 1915
6802e340 1916 return gi->gl;
7c52b166
RP
1917}
1918
6802e340 1919static void gfs2_glock_seq_stop(struct seq_file *seq, void *iter_ptr)
7c52b166 1920{
6802e340 1921 struct gfs2_glock_iter *gi = seq->private;
bc015cb8
SW
1922
1923 if (gi->gl)
1924 rcu_read_unlock();
1925 gi->gl = NULL;
7c52b166
RP
1926}
1927
6802e340 1928static int gfs2_glock_seq_show(struct seq_file *seq, void *iter_ptr)
7c52b166 1929{
6802e340 1930 return dump_glock(seq, iter_ptr);
7c52b166
RP
1931}
1932
a245769f
SW
1933static void *gfs2_sbstats_seq_start(struct seq_file *seq, loff_t *pos)
1934{
1935 struct gfs2_glock_iter *gi = seq->private;
1936
1937 gi->hash = *pos;
1938 if (*pos >= GFS2_NR_SBSTATS)
1939 return NULL;
1940 preempt_disable();
1941 return SEQ_START_TOKEN;
1942}
1943
1944static void *gfs2_sbstats_seq_next(struct seq_file *seq, void *iter_ptr,
1945 loff_t *pos)
1946{
1947 struct gfs2_glock_iter *gi = seq->private;
1948 (*pos)++;
1949 gi->hash++;
1950 if (gi->hash >= GFS2_NR_SBSTATS) {
1951 preempt_enable();
1952 return NULL;
1953 }
1954 return SEQ_START_TOKEN;
1955}
1956
1957static void gfs2_sbstats_seq_stop(struct seq_file *seq, void *iter_ptr)
1958{
1959 preempt_enable();
1960}
1961
4ef29002 1962static const struct seq_operations gfs2_glock_seq_ops = {
7c52b166
RP
1963 .start = gfs2_glock_seq_start,
1964 .next = gfs2_glock_seq_next,
1965 .stop = gfs2_glock_seq_stop,
1966 .show = gfs2_glock_seq_show,
1967};
1968
a245769f
SW
1969static const struct seq_operations gfs2_glstats_seq_ops = {
1970 .start = gfs2_glock_seq_start,
1971 .next = gfs2_glock_seq_next,
1972 .stop = gfs2_glock_seq_stop,
1973 .show = gfs2_glstats_seq_show,
1974};
1975
1976static const struct seq_operations gfs2_sbstats_seq_ops = {
1977 .start = gfs2_sbstats_seq_start,
1978 .next = gfs2_sbstats_seq_next,
1979 .stop = gfs2_sbstats_seq_stop,
1980 .show = gfs2_sbstats_seq_show,
1981};
1982
1983static int gfs2_glocks_open(struct inode *inode, struct file *file)
7c52b166 1984{
6802e340
SW
1985 int ret = seq_open_private(file, &gfs2_glock_seq_ops,
1986 sizeof(struct gfs2_glock_iter));
1987 if (ret == 0) {
1988 struct seq_file *seq = file->private_data;
1989 struct gfs2_glock_iter *gi = seq->private;
1990 gi->sdp = inode->i_private;
df5d2f55
SW
1991 seq->buf = kmalloc(8*PAGE_SIZE, GFP_KERNEL | __GFP_NOWARN);
1992 if (seq->buf)
1993 seq->size = 8*PAGE_SIZE;
6802e340
SW
1994 }
1995 return ret;
7c52b166
RP
1996}
1997
a245769f
SW
1998static int gfs2_glstats_open(struct inode *inode, struct file *file)
1999{
2000 int ret = seq_open_private(file, &gfs2_glstats_seq_ops,
2001 sizeof(struct gfs2_glock_iter));
2002 if (ret == 0) {
2003 struct seq_file *seq = file->private_data;
2004 struct gfs2_glock_iter *gi = seq->private;
2005 gi->sdp = inode->i_private;
df5d2f55
SW
2006 seq->buf = kmalloc(8*PAGE_SIZE, GFP_KERNEL | __GFP_NOWARN);
2007 if (seq->buf)
2008 seq->size = 8*PAGE_SIZE;
a245769f
SW
2009 }
2010 return ret;
2011}
2012
2013static int gfs2_sbstats_open(struct inode *inode, struct file *file)
2014{
2015 int ret = seq_open_private(file, &gfs2_sbstats_seq_ops,
2016 sizeof(struct gfs2_glock_iter));
2017 if (ret == 0) {
2018 struct seq_file *seq = file->private_data;
2019 struct gfs2_glock_iter *gi = seq->private;
2020 gi->sdp = inode->i_private;
2021 }
2022 return ret;
2023}
2024
2025static const struct file_operations gfs2_glocks_fops = {
2026 .owner = THIS_MODULE,
2027 .open = gfs2_glocks_open,
2028 .read = seq_read,
2029 .llseek = seq_lseek,
2030 .release = seq_release_private,
2031};
2032
2033static const struct file_operations gfs2_glstats_fops = {
7c52b166 2034 .owner = THIS_MODULE,
a245769f
SW
2035 .open = gfs2_glstats_open,
2036 .read = seq_read,
2037 .llseek = seq_lseek,
2038 .release = seq_release_private,
2039};
2040
2041static const struct file_operations gfs2_sbstats_fops = {
2042 .owner = THIS_MODULE,
2043 .open = gfs2_sbstats_open,
7c52b166
RP
2044 .read = seq_read,
2045 .llseek = seq_lseek,
6802e340 2046 .release = seq_release_private,
7c52b166
RP
2047};
2048
2049int gfs2_create_debugfs_file(struct gfs2_sbd *sdp)
2050{
5f882096
RP
2051 sdp->debugfs_dir = debugfs_create_dir(sdp->sd_table_name, gfs2_root);
2052 if (!sdp->debugfs_dir)
2053 return -ENOMEM;
2054 sdp->debugfs_dentry_glocks = debugfs_create_file("glocks",
2055 S_IFREG | S_IRUGO,
2056 sdp->debugfs_dir, sdp,
a245769f 2057 &gfs2_glocks_fops);
5f882096 2058 if (!sdp->debugfs_dentry_glocks)
a245769f
SW
2059 goto fail;
2060
2061 sdp->debugfs_dentry_glstats = debugfs_create_file("glstats",
2062 S_IFREG | S_IRUGO,
2063 sdp->debugfs_dir, sdp,
2064 &gfs2_glstats_fops);
2065 if (!sdp->debugfs_dentry_glstats)
2066 goto fail;
2067
2068 sdp->debugfs_dentry_sbstats = debugfs_create_file("sbstats",
2069 S_IFREG | S_IRUGO,
2070 sdp->debugfs_dir, sdp,
2071 &gfs2_sbstats_fops);
2072 if (!sdp->debugfs_dentry_sbstats)
2073 goto fail;
7c52b166
RP
2074
2075 return 0;
a245769f
SW
2076fail:
2077 gfs2_delete_debugfs_file(sdp);
2078 return -ENOMEM;
7c52b166
RP
2079}
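
Since the three files are created under gfs2_root (the "gfs2" directory set up
in gfs2_register_debugfs() below) inside a per-superblock directory named after
sdp->sd_table_name, they normally show up as
/sys/kernel/debug/gfs2/<table_name>/{glocks,glstats,sbstats} wherever debugfs is
mounted. A minimal userspace sketch for dumping the glocks file follows; the
debugfs mount point and the lock table name "mycluster:myfs" are assumptions
made for illustration only:

#include <stdio.h>

int main(void)
{
	char line[512];
	/* Assumes debugfs is mounted at /sys/kernel/debug and the lock
	 * table name of the mount is "mycluster:myfs" (hypothetical). */
	FILE *f = fopen("/sys/kernel/debug/gfs2/mycluster:myfs/glocks", "r");

	if (!f) {
		perror("fopen");
		return 1;
	}
	while (fgets(line, sizeof(line), f))
		fputs(line, stdout);	/* one record per line, e.g. "G: ..." */
	fclose(f);
	return 0;
}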
2080
2081void gfs2_delete_debugfs_file(struct gfs2_sbd *sdp)
2082{
a245769f 2083 if (sdp->debugfs_dir) {
5f882096
RP
2084 if (sdp->debugfs_dentry_glocks) {
2085 debugfs_remove(sdp->debugfs_dentry_glocks);
2086 sdp->debugfs_dentry_glocks = NULL;
2087 }
a245769f
SW
2088 if (sdp->debugfs_dentry_glstats) {
2089 debugfs_remove(sdp->debugfs_dentry_glstats);
2090 sdp->debugfs_dentry_glstats = NULL;
2091 }
2092 if (sdp->debugfs_dentry_sbstats) {
2093 debugfs_remove(sdp->debugfs_dentry_sbstats);
2094 sdp->debugfs_dentry_sbstats = NULL;
2095 }
5f882096
RP
2096 debugfs_remove(sdp->debugfs_dir);
2097 sdp->debugfs_dir = NULL;
2098 }
7c52b166
RP
2099}
2100
2101int gfs2_register_debugfs(void)
2102{
2103 gfs2_root = debugfs_create_dir("gfs2", NULL);
2104 return gfs2_root ? 0 : -ENOMEM;
2105}
2106
2107void gfs2_unregister_debugfs(void)
2108{
2109 debugfs_remove(gfs2_root);
5f882096 2110 gfs2_root = NULL;
7c52b166 2111}