]> git.proxmox.com Git - mirror_ubuntu-zesty-kernel.git/blame - fs/xfs/xfs_qm.c
xfs: Define a new function xfs_is_quota_inode()
[mirror_ubuntu-zesty-kernel.git] / fs / xfs / xfs_qm.c
CommitLineData
1da177e4 1/*
4ce3121f
NS
2 * Copyright (c) 2000-2005 Silicon Graphics, Inc.
3 * All Rights Reserved.
1da177e4 4 *
4ce3121f
NS
5 * This program is free software; you can redistribute it and/or
6 * modify it under the terms of the GNU General Public License as
1da177e4
LT
7 * published by the Free Software Foundation.
8 *
4ce3121f
NS
9 * This program is distributed in the hope that it would be useful,
10 * but WITHOUT ANY WARRANTY; without even the implied warranty of
11 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
12 * GNU General Public License for more details.
1da177e4 13 *
4ce3121f
NS
14 * You should have received a copy of the GNU General Public License
15 * along with this program; if not, write the Free Software Foundation,
16 * Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA
1da177e4 17 */
1da177e4
LT
18#include "xfs.h"
19#include "xfs_fs.h"
a844f451 20#include "xfs_bit.h"
1da177e4 21#include "xfs_log.h"
1da177e4
LT
22#include "xfs_trans.h"
23#include "xfs_sb.h"
24#include "xfs_ag.h"
1da177e4 25#include "xfs_alloc.h"
1da177e4
LT
26#include "xfs_quota.h"
27#include "xfs_mount.h"
1da177e4
LT
28#include "xfs_bmap_btree.h"
29#include "xfs_ialloc_btree.h"
1da177e4
LT
30#include "xfs_dinode.h"
31#include "xfs_inode.h"
a844f451
NS
32#include "xfs_ialloc.h"
33#include "xfs_itable.h"
1da177e4
LT
34#include "xfs_rtalloc.h"
35#include "xfs_error.h"
a844f451 36#include "xfs_bmap.h"
1da177e4
LT
37#include "xfs_attr.h"
38#include "xfs_buf_item.h"
39#include "xfs_trans_space.h"
40#include "xfs_utils.h"
1da177e4 41#include "xfs_qm.h"
0b1b213f 42#include "xfs_trace.h"
33479e05 43#include "xfs_icache.h"
6fcdc59d 44#include "xfs_cksum.h"
1da177e4
LT
45
46/*
47 * The global quota manager. There is only one of these for the entire
48 * system, _not_ one per file system. XQM keeps track of the overall
49 * quota functionality, including maintaining the freelist and hash
50 * tables of dquots.
51 */
1da177e4 52STATIC int xfs_qm_init_quotainos(xfs_mount_t *);
ba0f32d4 53STATIC int xfs_qm_init_quotainfo(xfs_mount_t *);
1495f230 54STATIC int xfs_qm_shake(struct shrinker *, struct shrink_control *);
1da177e4 55
b84a3a96
CH
56/*
57 * We use the batch lookup interface to iterate over the dquots as it
58 * currently is the only interface into the radix tree code that allows
59 * fuzzy lookups instead of exact matches. Holding the lock over multiple
60 * operations is fine as all callers are used either during mount/umount
61 * or quotaoff.
62 */
63#define XFS_DQ_LOOKUP_BATCH 32
64
65STATIC int
66xfs_qm_dquot_walk(
67 struct xfs_mount *mp,
68 int type,
43ff2122
CH
69 int (*execute)(struct xfs_dquot *dqp, void *data),
70 void *data)
b84a3a96
CH
71{
72 struct xfs_quotainfo *qi = mp->m_quotainfo;
73 struct radix_tree_root *tree = XFS_DQUOT_TREE(qi, type);
74 uint32_t next_index;
75 int last_error = 0;
76 int skipped;
77 int nr_found;
78
79restart:
80 skipped = 0;
81 next_index = 0;
82 nr_found = 0;
83
84 while (1) {
85 struct xfs_dquot *batch[XFS_DQ_LOOKUP_BATCH];
86 int error = 0;
87 int i;
88
89 mutex_lock(&qi->qi_tree_lock);
90 nr_found = radix_tree_gang_lookup(tree, (void **)batch,
91 next_index, XFS_DQ_LOOKUP_BATCH);
92 if (!nr_found) {
93 mutex_unlock(&qi->qi_tree_lock);
94 break;
95 }
96
97 for (i = 0; i < nr_found; i++) {
98 struct xfs_dquot *dqp = batch[i];
99
100 next_index = be32_to_cpu(dqp->q_core.d_id) + 1;
101
43ff2122 102 error = execute(batch[i], data);
b84a3a96
CH
103 if (error == EAGAIN) {
104 skipped++;
105 continue;
106 }
107 if (error && last_error != EFSCORRUPTED)
108 last_error = error;
109 }
110
111 mutex_unlock(&qi->qi_tree_lock);
112
113 /* bail out if the filesystem is corrupted. */
114 if (last_error == EFSCORRUPTED) {
115 skipped = 0;
116 break;
117 }
118 }
119
120 if (skipped) {
121 delay(1);
122 goto restart;
123 }
124
125 return last_error;
126}
127
128
129/*
130 * Purge a dquot from all tracking data structures and free it.
131 */
132STATIC int
133xfs_qm_dqpurge(
43ff2122
CH
134 struct xfs_dquot *dqp,
135 void *data)
b84a3a96
CH
136{
137 struct xfs_mount *mp = dqp->q_mount;
138 struct xfs_quotainfo *qi = mp->m_quotainfo;
139 struct xfs_dquot *gdqp = NULL;
140
141 xfs_dqlock(dqp);
142 if ((dqp->dq_flags & XFS_DQ_FREEING) || dqp->q_nrefs != 0) {
143 xfs_dqunlock(dqp);
144 return EAGAIN;
145 }
146
147 /*
148 * If this quota has a group hint attached, prepare for releasing it
149 * now.
150 */
151 gdqp = dqp->q_gdquot;
152 if (gdqp) {
153 xfs_dqlock(gdqp);
154 dqp->q_gdquot = NULL;
155 }
156
157 dqp->dq_flags |= XFS_DQ_FREEING;
158
43ff2122 159 xfs_dqflock(dqp);
b84a3a96
CH
160
161 /*
162 * If we are turning this type of quotas off, we don't care
163 * about the dirty metadata sitting in this dquot. OTOH, if
164 * we're unmounting, we do care, so we flush it and wait.
165 */
166 if (XFS_DQ_IS_DIRTY(dqp)) {
fe7257fd
CH
167 struct xfs_buf *bp = NULL;
168 int error;
b84a3a96
CH
169
170 /*
171 * We don't care about getting disk errors here. We need
172 * to purge this dquot anyway, so we go ahead regardless.
173 */
fe7257fd
CH
174 error = xfs_qm_dqflush(dqp, &bp);
175 if (error) {
b84a3a96
CH
176 xfs_warn(mp, "%s: dquot %p flush failed",
177 __func__, dqp);
fe7257fd
CH
178 } else {
179 error = xfs_bwrite(bp);
180 xfs_buf_relse(bp);
181 }
b84a3a96
CH
182 xfs_dqflock(dqp);
183 }
184
185 ASSERT(atomic_read(&dqp->q_pincount) == 0);
186 ASSERT(XFS_FORCED_SHUTDOWN(mp) ||
187 !(dqp->q_logitem.qli_item.li_flags & XFS_LI_IN_AIL));
188
189 xfs_dqfunlock(dqp);
190 xfs_dqunlock(dqp);
191
192 radix_tree_delete(XFS_DQUOT_TREE(qi, dqp->q_core.d_flags),
193 be32_to_cpu(dqp->q_core.d_id));
194 qi->qi_dquots--;
195
196 /*
197 * We move dquots to the freelist as soon as their reference count
198 * hits zero, so it really should be on the freelist here.
199 */
200 mutex_lock(&qi->qi_lru_lock);
201 ASSERT(!list_empty(&dqp->q_lru));
202 list_del_init(&dqp->q_lru);
203 qi->qi_lru_count--;
204 XFS_STATS_DEC(xs_qm_dquot_unused);
205 mutex_unlock(&qi->qi_lru_lock);
206
207 xfs_qm_dqdestroy(dqp);
208
209 if (gdqp)
210 xfs_qm_dqput(gdqp);
211 return 0;
212}
213
214/*
215 * Purge the dquot cache.
216 */
217void
218xfs_qm_dqpurge_all(
219 struct xfs_mount *mp,
220 uint flags)
221{
222 if (flags & XFS_QMOPT_UQUOTA)
43ff2122 223 xfs_qm_dquot_walk(mp, XFS_DQ_USER, xfs_qm_dqpurge, NULL);
b84a3a96 224 if (flags & XFS_QMOPT_GQUOTA)
43ff2122 225 xfs_qm_dquot_walk(mp, XFS_DQ_GROUP, xfs_qm_dqpurge, NULL);
b84a3a96 226 if (flags & XFS_QMOPT_PQUOTA)
43ff2122 227 xfs_qm_dquot_walk(mp, XFS_DQ_PROJ, xfs_qm_dqpurge, NULL);
b84a3a96
CH
228}
229
1da177e4
LT
230/*
231 * Just destroy the quotainfo structure.
232 */
233void
7d095257
CH
234xfs_qm_unmount(
235 struct xfs_mount *mp)
1da177e4 236{
7d095257 237 if (mp->m_quotainfo) {
8112e9dc 238 xfs_qm_dqpurge_all(mp, XFS_QMOPT_QUOTALL);
1da177e4 239 xfs_qm_destroy_quotainfo(mp);
7d095257 240 }
1da177e4
LT
241}
242
243
244/*
245 * This is called from xfs_mountfs to start quotas and initialize all
246 * necessary data structures like quotainfo. This is also responsible for
247 * running a quotacheck as necessary. We are guaranteed that the superblock
248 * is consistently read in at this point.
53aa7915
DC
249 *
250 * If we fail here, the mount will continue with quota turned off. We don't
251 * need to inidicate success or failure at all.
1da177e4 252 */
53aa7915 253void
1da177e4 254xfs_qm_mount_quotas(
4249023a 255 xfs_mount_t *mp)
1da177e4 256{
1da177e4
LT
257 int error = 0;
258 uint sbf;
259
1da177e4
LT
260 /*
261 * If quotas on realtime volumes is not supported, we disable
262 * quotas immediately.
263 */
264 if (mp->m_sb.sb_rextents) {
0b932ccc 265 xfs_notice(mp, "Cannot turn on quotas for realtime filesystem");
1da177e4
LT
266 mp->m_qflags = 0;
267 goto write_changes;
268 }
269
1da177e4 270 ASSERT(XFS_IS_QUOTA_RUNNING(mp));
155ffd07 271
1da177e4
LT
272 /*
273 * Allocate the quotainfo structure inside the mount struct, and
274 * create quotainode(s), and change/rev superblock if necessary.
275 */
53aa7915
DC
276 error = xfs_qm_init_quotainfo(mp);
277 if (error) {
1da177e4
LT
278 /*
279 * We must turn off quotas.
280 */
281 ASSERT(mp->m_quotainfo == NULL);
282 mp->m_qflags = 0;
283 goto write_changes;
284 }
285 /*
286 * If any of the quotas are not consistent, do a quotacheck.
287 */
4249023a 288 if (XFS_QM_NEED_QUOTACHECK(mp)) {
53aa7915
DC
289 error = xfs_qm_quotacheck(mp);
290 if (error) {
291 /* Quotacheck failed and disabled quotas. */
292 return;
1da177e4 293 }
1da177e4 294 }
646d5bda
DD
295 /*
296 * If one type of quotas is off, then it will lose its
297 * quotachecked status, since we won't be doing accounting for
298 * that type anymore.
299 */
53aa7915 300 if (!XFS_IS_UQUOTA_ON(mp))
646d5bda 301 mp->m_qflags &= ~XFS_UQUOTA_CHKD;
53aa7915 302 if (!(XFS_IS_GQUOTA_ON(mp) || XFS_IS_PQUOTA_ON(mp)))
646d5bda 303 mp->m_qflags &= ~XFS_OQUOTA_CHKD;
155ffd07 304
1da177e4
LT
305 write_changes:
306 /*
3685c2a1 307 * We actually don't have to acquire the m_sb_lock at all.
1da177e4
LT
308 * This can only be called from mount, and that's single threaded. XXX
309 */
3685c2a1 310 spin_lock(&mp->m_sb_lock);
1da177e4
LT
311 sbf = mp->m_sb.sb_qflags;
312 mp->m_sb.sb_qflags = mp->m_qflags & XFS_MOUNT_QUOTA_ALL;
3685c2a1 313 spin_unlock(&mp->m_sb_lock);
1da177e4
LT
314
315 if (sbf != (mp->m_qflags & XFS_MOUNT_QUOTA_ALL)) {
316 if (xfs_qm_write_sb_changes(mp, XFS_SB_QFLAGS)) {
317 /*
318 * We could only have been turning quotas off.
319 * We aren't in very good shape actually because
320 * the incore structures are convinced that quotas are
321 * off, but the on disk superblock doesn't know that !
322 */
323 ASSERT(!(XFS_IS_QUOTA_RUNNING(mp)));
53487786
DC
324 xfs_alert(mp, "%s: Superblock update failed!",
325 __func__);
1da177e4
LT
326 }
327 }
328
329 if (error) {
53487786 330 xfs_warn(mp, "Failed to initialize disk quotas.");
7d095257 331 return;
1da177e4 332 }
1da177e4
LT
333}
334
335/*
336 * Called from the vfsops layer.
337 */
e57481dc 338void
1da177e4
LT
339xfs_qm_unmount_quotas(
340 xfs_mount_t *mp)
341{
1da177e4
LT
342 /*
343 * Release the dquots that root inode, et al might be holding,
344 * before we flush quotas and blow away the quotainfo structure.
345 */
346 ASSERT(mp->m_rootip);
347 xfs_qm_dqdetach(mp->m_rootip);
348 if (mp->m_rbmip)
349 xfs_qm_dqdetach(mp->m_rbmip);
350 if (mp->m_rsumip)
351 xfs_qm_dqdetach(mp->m_rsumip);
352
353 /*
e57481dc 354 * Release the quota inodes.
1da177e4 355 */
1da177e4 356 if (mp->m_quotainfo) {
e57481dc
CH
357 if (mp->m_quotainfo->qi_uquotaip) {
358 IRELE(mp->m_quotainfo->qi_uquotaip);
359 mp->m_quotainfo->qi_uquotaip = NULL;
1da177e4 360 }
e57481dc
CH
361 if (mp->m_quotainfo->qi_gquotaip) {
362 IRELE(mp->m_quotainfo->qi_gquotaip);
363 mp->m_quotainfo->qi_gquotaip = NULL;
1da177e4
LT
364 }
365 }
1da177e4
LT
366}
367
1da177e4
LT
368STATIC int
369xfs_qm_dqattach_one(
370 xfs_inode_t *ip,
371 xfs_dqid_t id,
372 uint type,
373 uint doalloc,
1da177e4
LT
374 xfs_dquot_t *udqhint, /* hint */
375 xfs_dquot_t **IO_idqpp)
376{
377 xfs_dquot_t *dqp;
378 int error;
379
579aa9ca 380 ASSERT(xfs_isilocked(ip, XFS_ILOCK_EXCL));
1da177e4 381 error = 0;
8e9b6e7f 382
1da177e4
LT
383 /*
384 * See if we already have it in the inode itself. IO_idqpp is
385 * &i_udquot or &i_gdquot. This made the code look weird, but
386 * made the logic a lot simpler.
387 */
8e9b6e7f
CH
388 dqp = *IO_idqpp;
389 if (dqp) {
0b1b213f 390 trace_xfs_dqattach_found(dqp);
8e9b6e7f 391 return 0;
1da177e4
LT
392 }
393
394 /*
395 * udqhint is the i_udquot field in inode, and is non-NULL only
c8ad20ff 396 * when the type arg is group/project. Its purpose is to save a
1da177e4
LT
397 * lookup by dqid (xfs_qm_dqget) by caching a group dquot inside
398 * the user dquot.
399 */
8e9b6e7f
CH
400 if (udqhint) {
401 ASSERT(type == XFS_DQ_GROUP || type == XFS_DQ_PROJ);
1da177e4
LT
402 xfs_dqlock(udqhint);
403
8e9b6e7f
CH
404 /*
405 * No need to take dqlock to look at the id.
406 *
407 * The ID can't change until it gets reclaimed, and it won't
408 * be reclaimed as long as we have a ref from inode and we
409 * hold the ilock.
410 */
411 dqp = udqhint->q_gdquot;
412 if (dqp && be32_to_cpu(dqp->q_core.d_id) == id) {
8e9b6e7f 413 ASSERT(*IO_idqpp == NULL);
8e9b6e7f 414
78e55892 415 *IO_idqpp = xfs_qm_dqhold(dqp);
1da177e4 416 xfs_dqunlock(udqhint);
8e9b6e7f 417 return 0;
1da177e4 418 }
8e9b6e7f
CH
419
420 /*
421 * We can't hold a dquot lock when we call the dqget code.
422 * We'll deadlock in no time, because of (not conforming to)
423 * lock ordering - the inodelock comes before any dquot lock,
424 * and we may drop and reacquire the ilock in xfs_qm_dqget().
425 */
1da177e4 426 xfs_dqunlock(udqhint);
8e9b6e7f
CH
427 }
428
1da177e4
LT
429 /*
430 * Find the dquot from somewhere. This bumps the
431 * reference count of dquot and returns it locked.
432 * This can return ENOENT if dquot didn't exist on
433 * disk and we didn't ask it to allocate;
434 * ESRCH if quotas got turned off suddenly.
435 */
db3e74b5
MH
436 error = xfs_qm_dqget(ip->i_mount, ip, id, type,
437 doalloc | XFS_QMOPT_DOWARN, &dqp);
8e9b6e7f
CH
438 if (error)
439 return error;
1da177e4 440
0b1b213f 441 trace_xfs_dqattach_get(dqp);
8e9b6e7f 442
1da177e4
LT
443 /*
444 * dqget may have dropped and re-acquired the ilock, but it guarantees
445 * that the dquot returned is the one that should go in the inode.
446 */
447 *IO_idqpp = dqp;
8e9b6e7f
CH
448 xfs_dqunlock(dqp);
449 return 0;
1da177e4
LT
450}
451
452
453/*
454 * Given a udquot and gdquot, attach a ptr to the group dquot in the
ab680bb7 455 * udquot as a hint for future lookups.
1da177e4
LT
456 */
457STATIC void
458xfs_qm_dqattach_grouphint(
459 xfs_dquot_t *udq,
8e9b6e7f 460 xfs_dquot_t *gdq)
1da177e4
LT
461{
462 xfs_dquot_t *tmp;
463
8e9b6e7f 464 xfs_dqlock(udq);
1da177e4 465
ab680bb7
CH
466 tmp = udq->q_gdquot;
467 if (tmp) {
468 if (tmp == gdq)
469 goto done;
1da177e4
LT
470
471 udq->q_gdquot = NULL;
1da177e4 472 xfs_qm_dqrele(tmp);
1da177e4 473 }
8e9b6e7f 474
78e55892 475 udq->q_gdquot = xfs_qm_dqhold(gdq);
ab680bb7 476done:
8e9b6e7f 477 xfs_dqunlock(udq);
1da177e4
LT
478}
479
b4d05e30
CH
480static bool
481xfs_qm_need_dqattach(
482 struct xfs_inode *ip)
483{
484 struct xfs_mount *mp = ip->i_mount;
485
486 if (!XFS_IS_QUOTA_RUNNING(mp))
487 return false;
488 if (!XFS_IS_QUOTA_ON(mp))
489 return false;
490 if (!XFS_NOT_DQATTACHED(mp, ip))
491 return false;
9cad19d2 492 if (xfs_is_quota_inode(&mp->m_sb, ip->i_ino))
b4d05e30
CH
493 return false;
494 return true;
495}
1da177e4
LT
496
497/*
c8ad20ff
NS
498 * Given a locked inode, attach dquot(s) to it, taking U/G/P-QUOTAON
499 * into account.
1da177e4 500 * If XFS_QMOPT_DQALLOC, the dquot(s) will be allocated if needed.
1da177e4
LT
501 * Inode may get unlocked and relocked in here, and the caller must deal with
502 * the consequences.
503 */
504int
7d095257 505xfs_qm_dqattach_locked(
1da177e4
LT
506 xfs_inode_t *ip,
507 uint flags)
508{
509 xfs_mount_t *mp = ip->i_mount;
510 uint nquotas = 0;
511 int error = 0;
512
b4d05e30 513 if (!xfs_qm_need_dqattach(ip))
014c2544 514 return 0;
1da177e4 515
7d095257 516 ASSERT(xfs_isilocked(ip, XFS_ILOCK_EXCL));
1da177e4
LT
517
518 if (XFS_IS_UQUOTA_ON(mp)) {
519 error = xfs_qm_dqattach_one(ip, ip->i_d.di_uid, XFS_DQ_USER,
520 flags & XFS_QMOPT_DQALLOC,
1da177e4
LT
521 NULL, &ip->i_udquot);
522 if (error)
523 goto done;
524 nquotas++;
525 }
579aa9ca
CH
526
527 ASSERT(xfs_isilocked(ip, XFS_ILOCK_EXCL));
c8ad20ff
NS
528 if (XFS_IS_OQUOTA_ON(mp)) {
529 error = XFS_IS_GQUOTA_ON(mp) ?
530 xfs_qm_dqattach_one(ip, ip->i_d.di_gid, XFS_DQ_GROUP,
531 flags & XFS_QMOPT_DQALLOC,
c8ad20ff 532 ip->i_udquot, &ip->i_gdquot) :
6743099c 533 xfs_qm_dqattach_one(ip, xfs_get_projid(ip), XFS_DQ_PROJ,
1da177e4 534 flags & XFS_QMOPT_DQALLOC,
1da177e4
LT
535 ip->i_udquot, &ip->i_gdquot);
536 /*
537 * Don't worry about the udquot that we may have
538 * attached above. It'll get detached, if not already.
539 */
540 if (error)
541 goto done;
542 nquotas++;
543 }
544
545 /*
546 * Attach this group quota to the user quota as a hint.
547 * This WON'T, in general, result in a thrash.
548 */
549 if (nquotas == 2) {
579aa9ca 550 ASSERT(xfs_isilocked(ip, XFS_ILOCK_EXCL));
1da177e4
LT
551 ASSERT(ip->i_udquot);
552 ASSERT(ip->i_gdquot);
553
554 /*
ab680bb7
CH
555 * We do not have i_udquot locked at this point, but this check
556 * is OK since we don't depend on the i_gdquot to be accurate
557 * 100% all the time. It is just a hint, and this will
558 * succeed in general.
1da177e4 559 */
ab680bb7
CH
560 if (ip->i_udquot->q_gdquot != ip->i_gdquot)
561 xfs_qm_dqattach_grouphint(ip->i_udquot, ip->i_gdquot);
1da177e4
LT
562 }
563
7d095257 564 done:
ea15ab3c
CH
565#ifdef DEBUG
566 if (!error) {
1da177e4
LT
567 if (XFS_IS_UQUOTA_ON(mp))
568 ASSERT(ip->i_udquot);
c8ad20ff 569 if (XFS_IS_OQUOTA_ON(mp))
1da177e4
LT
570 ASSERT(ip->i_gdquot);
571 }
7d095257 572 ASSERT(xfs_isilocked(ip, XFS_ILOCK_EXCL));
1da177e4 573#endif
7d095257
CH
574 return error;
575}
1da177e4 576
7d095257
CH
577int
578xfs_qm_dqattach(
579 struct xfs_inode *ip,
580 uint flags)
581{
582 int error;
583
b4d05e30
CH
584 if (!xfs_qm_need_dqattach(ip))
585 return 0;
586
7d095257
CH
587 xfs_ilock(ip, XFS_ILOCK_EXCL);
588 error = xfs_qm_dqattach_locked(ip, flags);
589 xfs_iunlock(ip, XFS_ILOCK_EXCL);
1da177e4 590
014c2544 591 return error;
1da177e4
LT
592}
593
594/*
595 * Release dquots (and their references) if any.
596 * The inode should be locked EXCL except when this's called by
597 * xfs_ireclaim.
598 */
599void
600xfs_qm_dqdetach(
601 xfs_inode_t *ip)
602{
603 if (!(ip->i_udquot || ip->i_gdquot))
604 return;
605
0b1b213f
CH
606 trace_xfs_dquot_dqdetach(ip);
607
9cad19d2 608 ASSERT(!xfs_is_quota_inode(&ip->i_mount->m_sb, ip->i_ino));
1da177e4
LT
609 if (ip->i_udquot) {
610 xfs_qm_dqrele(ip->i_udquot);
611 ip->i_udquot = NULL;
612 }
613 if (ip->i_gdquot) {
614 xfs_qm_dqrele(ip->i_gdquot);
615 ip->i_gdquot = NULL;
616 }
617}
618
3fe58f30
CH
619int
620xfs_qm_calc_dquots_per_chunk(
621 struct xfs_mount *mp,
622 unsigned int nbblks) /* basic block units */
623{
624 unsigned int ndquots;
625
626 ASSERT(nbblks > 0);
627 ndquots = BBTOB(nbblks);
628 do_div(ndquots, sizeof(xfs_dqblk_t));
629
630 return ndquots;
631}
632
1da177e4
LT
633/*
634 * This initializes all the quota information that's kept in the
635 * mount structure
636 */
ba0f32d4 637STATIC int
1da177e4
LT
638xfs_qm_init_quotainfo(
639 xfs_mount_t *mp)
640{
641 xfs_quotainfo_t *qinf;
642 int error;
643 xfs_dquot_t *dqp;
644
645 ASSERT(XFS_IS_QUOTA_RUNNING(mp));
646
1da177e4
LT
647 qinf = mp->m_quotainfo = kmem_zalloc(sizeof(xfs_quotainfo_t), KM_SLEEP);
648
649 /*
650 * See if quotainodes are setup, and if not, allocate them,
651 * and change the superblock accordingly.
652 */
653 if ((error = xfs_qm_init_quotainos(mp))) {
f0e2d93c 654 kmem_free(qinf);
1da177e4 655 mp->m_quotainfo = NULL;
014c2544 656 return error;
1da177e4
LT
657 }
658
9f920f11
CH
659 INIT_RADIX_TREE(&qinf->qi_uquota_tree, GFP_NOFS);
660 INIT_RADIX_TREE(&qinf->qi_gquota_tree, GFP_NOFS);
661 mutex_init(&qinf->qi_tree_lock);
662
f8739c3c
CH
663 INIT_LIST_HEAD(&qinf->qi_lru_list);
664 qinf->qi_lru_count = 0;
665 mutex_init(&qinf->qi_lru_lock);
666
1da177e4 667 /* mutex used to serialize quotaoffs */
794ee1ba 668 mutex_init(&qinf->qi_quotaofflock);
1da177e4
LT
669
670 /* Precalc some constants */
671 qinf->qi_dqchunklen = XFS_FSB_TO_BB(mp, XFS_DQUOT_CLUSTER_SIZE_FSB);
3fe58f30
CH
672 qinf->qi_dqperchunk = xfs_qm_calc_dquots_per_chunk(mp,
673 qinf->qi_dqchunklen);
1da177e4
LT
674
675 mp->m_qflags |= (mp->m_sb.sb_qflags & XFS_ALL_QUOTA_CHKD);
676
677 /*
678 * We try to get the limits from the superuser's limits fields.
679 * This is quite hacky, but it is standard quota practice.
7ae44407 680 *
1da177e4
LT
681 * We look at the USR dquot with id == 0 first, but if user quotas
682 * are not enabled we goto the GRP dquot with id == 0.
683 * We don't really care to keep separate default limits for user
684 * and group quotas, at least not at this point.
7ae44407
CH
685 *
686 * Since we may not have done a quotacheck by this point, just read
687 * the dquot without attaching it to any hashtables or lists.
1da177e4 688 */
7ae44407
CH
689 error = xfs_qm_dqread(mp, 0,
690 XFS_IS_UQUOTA_RUNNING(mp) ? XFS_DQ_USER :
691 (XFS_IS_GQUOTA_RUNNING(mp) ? XFS_DQ_GROUP :
692 XFS_DQ_PROJ),
693 XFS_QMOPT_DOWARN, &dqp);
694 if (!error) {
1da177e4
LT
695 xfs_disk_dquot_t *ddqp = &dqp->q_core;
696
697 /*
698 * The warnings and timers set the grace period given to
699 * a user or group before he or she can not perform any
700 * more writing. If it is zero, a default is used.
701 */
1149d96a
CH
702 qinf->qi_btimelimit = ddqp->d_btimer ?
703 be32_to_cpu(ddqp->d_btimer) : XFS_QM_BTIMELIMIT;
704 qinf->qi_itimelimit = ddqp->d_itimer ?
705 be32_to_cpu(ddqp->d_itimer) : XFS_QM_ITIMELIMIT;
706 qinf->qi_rtbtimelimit = ddqp->d_rtbtimer ?
707 be32_to_cpu(ddqp->d_rtbtimer) : XFS_QM_RTBTIMELIMIT;
708 qinf->qi_bwarnlimit = ddqp->d_bwarns ?
709 be16_to_cpu(ddqp->d_bwarns) : XFS_QM_BWARNLIMIT;
710 qinf->qi_iwarnlimit = ddqp->d_iwarns ?
711 be16_to_cpu(ddqp->d_iwarns) : XFS_QM_IWARNLIMIT;
712 qinf->qi_rtbwarnlimit = ddqp->d_rtbwarns ?
713 be16_to_cpu(ddqp->d_rtbwarns) : XFS_QM_RTBWARNLIMIT;
714 qinf->qi_bhardlimit = be64_to_cpu(ddqp->d_blk_hardlimit);
715 qinf->qi_bsoftlimit = be64_to_cpu(ddqp->d_blk_softlimit);
716 qinf->qi_ihardlimit = be64_to_cpu(ddqp->d_ino_hardlimit);
717 qinf->qi_isoftlimit = be64_to_cpu(ddqp->d_ino_softlimit);
718 qinf->qi_rtbhardlimit = be64_to_cpu(ddqp->d_rtb_hardlimit);
719 qinf->qi_rtbsoftlimit = be64_to_cpu(ddqp->d_rtb_softlimit);
1da177e4 720
1da177e4
LT
721 xfs_qm_dqdestroy(dqp);
722 } else {
723 qinf->qi_btimelimit = XFS_QM_BTIMELIMIT;
724 qinf->qi_itimelimit = XFS_QM_ITIMELIMIT;
725 qinf->qi_rtbtimelimit = XFS_QM_RTBTIMELIMIT;
726 qinf->qi_bwarnlimit = XFS_QM_BWARNLIMIT;
727 qinf->qi_iwarnlimit = XFS_QM_IWARNLIMIT;
06d10dd9 728 qinf->qi_rtbwarnlimit = XFS_QM_RTBWARNLIMIT;
1da177e4
LT
729 }
730
f8739c3c
CH
731 qinf->qi_shrinker.shrink = xfs_qm_shake;
732 qinf->qi_shrinker.seeks = DEFAULT_SEEKS;
733 register_shrinker(&qinf->qi_shrinker);
014c2544 734 return 0;
1da177e4
LT
735}
736
737
738/*
739 * Gets called when unmounting a filesystem or when all quotas get
740 * turned off.
741 * This purges the quota inodes, destroys locks and frees itself.
742 */
743void
744xfs_qm_destroy_quotainfo(
745 xfs_mount_t *mp)
746{
747 xfs_quotainfo_t *qi;
748
749 qi = mp->m_quotainfo;
750 ASSERT(qi != NULL);
1da177e4 751
f8739c3c
CH
752 unregister_shrinker(&qi->qi_shrinker);
753
1da177e4 754 if (qi->qi_uquotaip) {
26cc0021 755 IRELE(qi->qi_uquotaip);
1da177e4
LT
756 qi->qi_uquotaip = NULL; /* paranoia */
757 }
758 if (qi->qi_gquotaip) {
26cc0021 759 IRELE(qi->qi_gquotaip);
1da177e4
LT
760 qi->qi_gquotaip = NULL;
761 }
762 mutex_destroy(&qi->qi_quotaofflock);
f0e2d93c 763 kmem_free(qi);
1da177e4
LT
764 mp->m_quotainfo = NULL;
765}
766
1da177e4
LT
767/*
768 * Create an inode and return with a reference already taken, but unlocked
769 * This is how we create quota inodes
770 */
771STATIC int
772xfs_qm_qino_alloc(
773 xfs_mount_t *mp,
774 xfs_inode_t **ip,
775 __int64_t sbfields,
776 uint flags)
777{
778 xfs_trans_t *tp;
779 int error;
1da177e4
LT
780 int committed;
781
061f7209 782 tp = xfs_trans_alloc(mp, XFS_TRANS_QM_QINOCREATE);
1da177e4
LT
783 if ((error = xfs_trans_reserve(tp,
784 XFS_QM_QINOCREATE_SPACE_RES(mp),
785 XFS_CREATE_LOG_RES(mp), 0,
786 XFS_TRANS_PERM_LOG_RES,
787 XFS_CREATE_LOG_COUNT))) {
788 xfs_trans_cancel(tp, 0);
014c2544 789 return error;
1da177e4 790 }
1da177e4 791
6c77b0ea
CH
792 error = xfs_dir_ialloc(&tp, NULL, S_IFREG, 1, 0, 0, 1, ip, &committed);
793 if (error) {
1da177e4
LT
794 xfs_trans_cancel(tp, XFS_TRANS_RELEASE_LOG_RES |
795 XFS_TRANS_ABORT);
014c2544 796 return error;
1da177e4
LT
797 }
798
1da177e4
LT
799 /*
800 * Make the changes in the superblock, and log those too.
801 * sbfields arg may contain fields other than *QUOTINO;
802 * VERSIONNUM for example.
803 */
3685c2a1 804 spin_lock(&mp->m_sb_lock);
1da177e4 805 if (flags & XFS_QMOPT_SBVERSION) {
62118709 806 ASSERT(!xfs_sb_version_hasquota(&mp->m_sb));
1da177e4
LT
807 ASSERT((sbfields & (XFS_SB_VERSIONNUM | XFS_SB_UQUOTINO |
808 XFS_SB_GQUOTINO | XFS_SB_QFLAGS)) ==
809 (XFS_SB_VERSIONNUM | XFS_SB_UQUOTINO |
810 XFS_SB_GQUOTINO | XFS_SB_QFLAGS));
811
62118709 812 xfs_sb_version_addquota(&mp->m_sb);
1da177e4
LT
813 mp->m_sb.sb_uquotino = NULLFSINO;
814 mp->m_sb.sb_gquotino = NULLFSINO;
815
816 /* qflags will get updated _after_ quotacheck */
817 mp->m_sb.sb_qflags = 0;
1da177e4
LT
818 }
819 if (flags & XFS_QMOPT_UQUOTA)
820 mp->m_sb.sb_uquotino = (*ip)->i_ino;
821 else
822 mp->m_sb.sb_gquotino = (*ip)->i_ino;
3685c2a1 823 spin_unlock(&mp->m_sb_lock);
1da177e4
LT
824 xfs_mod_sb(tp, sbfields);
825
1c72bf90 826 if ((error = xfs_trans_commit(tp, XFS_TRANS_RELEASE_LOG_RES))) {
53487786 827 xfs_alert(mp, "%s failed (error %d)!", __func__, error);
014c2544 828 return error;
1da177e4 829 }
014c2544 830 return 0;
1da177e4
LT
831}
832
833
5b139738 834STATIC void
1da177e4
LT
835xfs_qm_reset_dqcounts(
836 xfs_mount_t *mp,
837 xfs_buf_t *bp,
838 xfs_dqid_t id,
839 uint type)
840{
6fcdc59d 841 struct xfs_dqblk *dqb;
1da177e4
LT
842 int j;
843
0b1b213f
CH
844 trace_xfs_reset_dqcounts(bp, _RET_IP_);
845
1da177e4
LT
846 /*
847 * Reset all counters and timers. They'll be
848 * started afresh by xfs_qm_quotacheck.
849 */
850#ifdef DEBUG
851 j = XFS_FSB_TO_B(mp, XFS_DQUOT_CLUSTER_SIZE_FSB);
852 do_div(j, sizeof(xfs_dqblk_t));
8a7b8a89 853 ASSERT(mp->m_quotainfo->qi_dqperchunk == j);
1da177e4 854#endif
6fcdc59d 855 dqb = bp->b_addr;
8a7b8a89 856 for (j = 0; j < mp->m_quotainfo->qi_dqperchunk; j++) {
6fcdc59d
DC
857 struct xfs_disk_dquot *ddq;
858
859 ddq = (struct xfs_disk_dquot *)&dqb[j];
860
1da177e4
LT
861 /*
862 * Do a sanity check, and if needed, repair the dqblk. Don't
863 * output any warnings because it's perfectly possible to
c41564b5 864 * find uninitialised dquot blks. See comment in xfs_qm_dqcheck.
1da177e4 865 */
a0fa2b67 866 (void) xfs_qm_dqcheck(mp, ddq, id+j, type, XFS_QMOPT_DQREPAIR,
1da177e4 867 "xfs_quotacheck");
1149d96a
CH
868 ddq->d_bcount = 0;
869 ddq->d_icount = 0;
870 ddq->d_rtbcount = 0;
871 ddq->d_btimer = 0;
872 ddq->d_itimer = 0;
873 ddq->d_rtbtimer = 0;
874 ddq->d_bwarns = 0;
875 ddq->d_iwarns = 0;
876 ddq->d_rtbwarns = 0;
6fcdc59d
DC
877
878 if (xfs_sb_version_hascrc(&mp->m_sb)) {
879 xfs_update_cksum((char *)&dqb[j],
880 sizeof(struct xfs_dqblk),
881 XFS_DQUOT_CRC_OFF);
882 }
1da177e4 883 }
1da177e4
LT
884}
885
886STATIC int
887xfs_qm_dqiter_bufs(
43ff2122
CH
888 struct xfs_mount *mp,
889 xfs_dqid_t firstid,
890 xfs_fsblock_t bno,
891 xfs_filblks_t blkcnt,
892 uint flags,
893 struct list_head *buffer_list)
1da177e4 894{
43ff2122
CH
895 struct xfs_buf *bp;
896 int error;
897 int type;
1da177e4
LT
898
899 ASSERT(blkcnt > 0);
c8ad20ff
NS
900 type = flags & XFS_QMOPT_UQUOTA ? XFS_DQ_USER :
901 (flags & XFS_QMOPT_PQUOTA ? XFS_DQ_PROJ : XFS_DQ_GROUP);
1da177e4
LT
902 error = 0;
903
904 /*
905 * Blkcnt arg can be a very big number, and might even be
906 * larger than the log itself. So, we have to break it up into
907 * manageable-sized transactions.
908 * Note that we don't start a permanent transaction here; we might
909 * not be able to get a log reservation for the whole thing up front,
910 * and we don't really care to either, because we just discard
911 * everything if we were to crash in the middle of this loop.
912 */
913 while (blkcnt--) {
914 error = xfs_trans_read_buf(mp, NULL, mp->m_ddev_targp,
915 XFS_FSB_TO_DADDR(mp, bno),
c6319198 916 mp->m_quotainfo->qi_dqchunklen, 0, &bp,
1813dd64 917 &xfs_dquot_buf_ops);
1da177e4 918
3fe58f30 919 /*
6fcdc59d
DC
920 * CRC and validation errors will return a EFSCORRUPTED here. If
921 * this occurs, re-read without CRC validation so that we can
922 * repair the damage via xfs_qm_reset_dqcounts(). This process
923 * will leave a trace in the log indicating corruption has
924 * been detected.
3fe58f30 925 */
6fcdc59d
DC
926 if (error == EFSCORRUPTED) {
927 error = xfs_trans_read_buf(mp, NULL, mp->m_ddev_targp,
928 XFS_FSB_TO_DADDR(mp, bno),
929 mp->m_quotainfo->qi_dqchunklen, 0, &bp,
930 NULL);
931 }
932
933 if (error)
934 break;
935
5b139738 936 xfs_qm_reset_dqcounts(mp, bp, firstid, type);
43ff2122 937 xfs_buf_delwri_queue(bp, buffer_list);
61551f1e 938 xfs_buf_relse(bp);
6fcdc59d
DC
939
940 /* goto the next block. */
1da177e4 941 bno++;
8a7b8a89 942 firstid += mp->m_quotainfo->qi_dqperchunk;
1da177e4 943 }
43ff2122 944
014c2544 945 return error;
1da177e4
LT
946}
947
948/*
c8ad20ff 949 * Iterate over all allocated USR/GRP/PRJ dquots in the system, calling a
1da177e4
LT
950 * caller supplied function for every chunk of dquots that we find.
951 */
952STATIC int
953xfs_qm_dqiterate(
43ff2122
CH
954 struct xfs_mount *mp,
955 struct xfs_inode *qip,
956 uint flags,
957 struct list_head *buffer_list)
1da177e4 958{
43ff2122 959 struct xfs_bmbt_irec *map;
1da177e4
LT
960 int i, nmaps; /* number of map entries */
961 int error; /* return value */
962 xfs_fileoff_t lblkno;
963 xfs_filblks_t maxlblkcnt;
964 xfs_dqid_t firstid;
965 xfs_fsblock_t rablkno;
966 xfs_filblks_t rablkcnt;
967
968 error = 0;
969 /*
c41564b5 970 * This looks racy, but we can't keep an inode lock across a
1da177e4
LT
971 * trans_reserve. But, this gets called during quotacheck, and that
972 * happens only at mount time which is single threaded.
973 */
974 if (qip->i_d.di_nblocks == 0)
014c2544 975 return 0;
1da177e4
LT
976
977 map = kmem_alloc(XFS_DQITER_MAP_SIZE * sizeof(*map), KM_SLEEP);
978
979 lblkno = 0;
32972383 980 maxlblkcnt = XFS_B_TO_FSB(mp, mp->m_super->s_maxbytes);
1da177e4
LT
981 do {
982 nmaps = XFS_DQITER_MAP_SIZE;
983 /*
984 * We aren't changing the inode itself. Just changing
985 * some of its data. No new blocks are added here, and
986 * the inode is never added to the transaction.
987 */
988 xfs_ilock(qip, XFS_ILOCK_SHARED);
5c8ed202
DC
989 error = xfs_bmapi_read(qip, lblkno, maxlblkcnt - lblkno,
990 map, &nmaps, 0);
1da177e4
LT
991 xfs_iunlock(qip, XFS_ILOCK_SHARED);
992 if (error)
993 break;
994
995 ASSERT(nmaps <= XFS_DQITER_MAP_SIZE);
996 for (i = 0; i < nmaps; i++) {
997 ASSERT(map[i].br_startblock != DELAYSTARTBLOCK);
998 ASSERT(map[i].br_blockcount);
999
1000
1001 lblkno += map[i].br_blockcount;
1002
1003 if (map[i].br_startblock == HOLESTARTBLOCK)
1004 continue;
1005
1006 firstid = (xfs_dqid_t) map[i].br_startoff *
8a7b8a89 1007 mp->m_quotainfo->qi_dqperchunk;
1da177e4
LT
1008 /*
1009 * Do a read-ahead on the next extent.
1010 */
1011 if ((i+1 < nmaps) &&
1012 (map[i+1].br_startblock != HOLESTARTBLOCK)) {
1013 rablkcnt = map[i+1].br_blockcount;
1014 rablkno = map[i+1].br_startblock;
1015 while (rablkcnt--) {
1a1a3e97 1016 xfs_buf_readahead(mp->m_ddev_targp,
1da177e4 1017 XFS_FSB_TO_DADDR(mp, rablkno),
c3f8fc73
DC
1018 mp->m_quotainfo->qi_dqchunklen,
1019 NULL);
1da177e4
LT
1020 rablkno++;
1021 }
1022 }
1023 /*
1024 * Iterate thru all the blks in the extent and
1025 * reset the counters of all the dquots inside them.
1026 */
43ff2122
CH
1027 error = xfs_qm_dqiter_bufs(mp, firstid,
1028 map[i].br_startblock,
1029 map[i].br_blockcount,
1030 flags, buffer_list);
1031 if (error)
1032 goto out;
1da177e4 1033 }
1da177e4
LT
1034 } while (nmaps > 0);
1035
43ff2122 1036out:
f0e2d93c 1037 kmem_free(map);
014c2544 1038 return error;
1da177e4
LT
1039}
1040
1041/*
1042 * Called by dqusage_adjust in doing a quotacheck.
52fda114
CH
1043 *
1044 * Given the inode, and a dquot id this updates both the incore dqout as well
1045 * as the buffer copy. This is so that once the quotacheck is done, we can
1046 * just log all the buffers, as opposed to logging numerous updates to
1047 * individual dquots.
1da177e4 1048 */
52fda114 1049STATIC int
1da177e4 1050xfs_qm_quotacheck_dqadjust(
52fda114
CH
1051 struct xfs_inode *ip,
1052 xfs_dqid_t id,
1053 uint type,
1da177e4
LT
1054 xfs_qcnt_t nblks,
1055 xfs_qcnt_t rtblks)
1056{
52fda114
CH
1057 struct xfs_mount *mp = ip->i_mount;
1058 struct xfs_dquot *dqp;
1059 int error;
1060
1061 error = xfs_qm_dqget(mp, ip, id, type,
1062 XFS_QMOPT_DQALLOC | XFS_QMOPT_DOWARN, &dqp);
1063 if (error) {
1064 /*
1065 * Shouldn't be able to turn off quotas here.
1066 */
1067 ASSERT(error != ESRCH);
1068 ASSERT(error != ENOENT);
1069 return error;
1070 }
0b1b213f
CH
1071
1072 trace_xfs_dqadjust(dqp);
1073
1da177e4
LT
1074 /*
1075 * Adjust the inode count and the block count to reflect this inode's
1076 * resource usage.
1077 */
413d57c9 1078 be64_add_cpu(&dqp->q_core.d_icount, 1);
1da177e4
LT
1079 dqp->q_res_icount++;
1080 if (nblks) {
413d57c9 1081 be64_add_cpu(&dqp->q_core.d_bcount, nblks);
1da177e4
LT
1082 dqp->q_res_bcount += nblks;
1083 }
1084 if (rtblks) {
413d57c9 1085 be64_add_cpu(&dqp->q_core.d_rtbcount, rtblks);
1da177e4
LT
1086 dqp->q_res_rtbcount += rtblks;
1087 }
1088
1089 /*
1090 * Set default limits, adjust timers (since we changed usages)
191f8488
CH
1091 *
1092 * There are no timers for the default values set in the root dquot.
1da177e4 1093 */
191f8488 1094 if (dqp->q_core.d_id) {
4b6eae2e 1095 xfs_qm_adjust_dqlimits(mp, dqp);
52fda114 1096 xfs_qm_adjust_dqtimers(mp, &dqp->q_core);
1da177e4
LT
1097 }
1098
1099 dqp->dq_flags |= XFS_DQ_DIRTY;
52fda114
CH
1100 xfs_qm_dqput(dqp);
1101 return 0;
1da177e4
LT
1102}
1103
1104STATIC int
1105xfs_qm_get_rtblks(
1106 xfs_inode_t *ip,
1107 xfs_qcnt_t *O_rtblks)
1108{
1109 xfs_filblks_t rtblks; /* total rt blks */
4eea22f0 1110 xfs_extnum_t idx; /* extent record index */
1da177e4
LT
1111 xfs_ifork_t *ifp; /* inode fork pointer */
1112 xfs_extnum_t nextents; /* number of extent entries */
1da177e4
LT
1113 int error;
1114
1115 ASSERT(XFS_IS_REALTIME_INODE(ip));
1116 ifp = XFS_IFORK_PTR(ip, XFS_DATA_FORK);
1117 if (!(ifp->if_flags & XFS_IFEXTENTS)) {
1118 if ((error = xfs_iread_extents(NULL, ip, XFS_DATA_FORK)))
014c2544 1119 return error;
1da177e4
LT
1120 }
1121 rtblks = 0;
4eea22f0 1122 nextents = ifp->if_bytes / (uint)sizeof(xfs_bmbt_rec_t);
a6f64d4a
CH
1123 for (idx = 0; idx < nextents; idx++)
1124 rtblks += xfs_bmbt_get_blockcount(xfs_iext_get_ext(ifp, idx));
1da177e4 1125 *O_rtblks = (xfs_qcnt_t)rtblks;
014c2544 1126 return 0;
1da177e4
LT
1127}
1128
1129/*
1130 * callback routine supplied to bulkstat(). Given an inumber, find its
1131 * dquots and update them to account for resources taken by that inode.
1132 */
1133/* ARGSUSED */
1134STATIC int
1135xfs_qm_dqusage_adjust(
1136 xfs_mount_t *mp, /* mount point for filesystem */
1137 xfs_ino_t ino, /* inode number to get data for */
1138 void __user *buffer, /* not used */
1139 int ubsize, /* not used */
1da177e4 1140 int *ubused, /* not used */
1da177e4
LT
1141 int *res) /* result code value */
1142{
1143 xfs_inode_t *ip;
52fda114 1144 xfs_qcnt_t nblks, rtblks = 0;
1da177e4
LT
1145 int error;
1146
1147 ASSERT(XFS_IS_QUOTA_RUNNING(mp));
1148
1149 /*
1150 * rootino must have its resources accounted for, not so with the quota
1151 * inodes.
1152 */
9cad19d2 1153 if (xfs_is_quota_inode(&mp->m_sb, ino)) {
1da177e4
LT
1154 *res = BULKSTAT_RV_NOTHING;
1155 return XFS_ERROR(EINVAL);
1156 }
1157
1158 /*
1159 * We don't _need_ to take the ilock EXCL. However, the xfs_qm_dqget
1160 * interface expects the inode to be exclusively locked because that's
1161 * the case in all other instances. It's OK that we do this because
1162 * quotacheck is done only at mount time.
1163 */
52fda114
CH
1164 error = xfs_iget(mp, NULL, ino, 0, XFS_ILOCK_EXCL, &ip);
1165 if (error) {
1da177e4 1166 *res = BULKSTAT_RV_NOTHING;
014c2544 1167 return error;
1da177e4
LT
1168 }
1169
52fda114 1170 ASSERT(ip->i_delayed_blks == 0);
1da177e4 1171
52fda114 1172 if (XFS_IS_REALTIME_INODE(ip)) {
1da177e4
LT
1173 /*
1174 * Walk thru the extent list and count the realtime blocks.
1175 */
52fda114
CH
1176 error = xfs_qm_get_rtblks(ip, &rtblks);
1177 if (error)
1178 goto error0;
1da177e4 1179 }
1da177e4 1180
52fda114 1181 nblks = (xfs_qcnt_t)ip->i_d.di_nblocks - rtblks;
1da177e4
LT
1182
1183 /*
1184 * Add the (disk blocks and inode) resources occupied by this
1185 * inode to its dquots. We do this adjustment in the incore dquot,
1186 * and also copy the changes to its buffer.
1187 * We don't care about putting these changes in a transaction
1188 * envelope because if we crash in the middle of a 'quotacheck'
1189 * we have to start from the beginning anyway.
1190 * Once we're done, we'll log all the dquot bufs.
1191 *
c41564b5 1192 * The *QUOTA_ON checks below may look pretty racy, but quotachecks
1da177e4
LT
1193 * and quotaoffs don't race. (Quotachecks happen at mount time only).
1194 */
1195 if (XFS_IS_UQUOTA_ON(mp)) {
52fda114
CH
1196 error = xfs_qm_quotacheck_dqadjust(ip, ip->i_d.di_uid,
1197 XFS_DQ_USER, nblks, rtblks);
1198 if (error)
1199 goto error0;
1da177e4 1200 }
52fda114
CH
1201
1202 if (XFS_IS_GQUOTA_ON(mp)) {
1203 error = xfs_qm_quotacheck_dqadjust(ip, ip->i_d.di_gid,
1204 XFS_DQ_GROUP, nblks, rtblks);
1205 if (error)
1206 goto error0;
1da177e4 1207 }
1da177e4 1208
52fda114 1209 if (XFS_IS_PQUOTA_ON(mp)) {
6743099c 1210 error = xfs_qm_quotacheck_dqadjust(ip, xfs_get_projid(ip),
52fda114
CH
1211 XFS_DQ_PROJ, nblks, rtblks);
1212 if (error)
1213 goto error0;
1214 }
1215
1216 xfs_iunlock(ip, XFS_ILOCK_EXCL);
1217 IRELE(ip);
1da177e4 1218 *res = BULKSTAT_RV_DIDONE;
014c2544 1219 return 0;
52fda114
CH
1220
1221error0:
1222 xfs_iunlock(ip, XFS_ILOCK_EXCL);
1223 IRELE(ip);
1224 *res = BULKSTAT_RV_GIVEUP;
1225 return error;
1da177e4
LT
1226}
1227
b84a3a96
CH
1228STATIC int
1229xfs_qm_flush_one(
43ff2122
CH
1230 struct xfs_dquot *dqp,
1231 void *data)
b84a3a96 1232{
43ff2122 1233 struct list_head *buffer_list = data;
fe7257fd 1234 struct xfs_buf *bp = NULL;
b84a3a96
CH
1235 int error = 0;
1236
1237 xfs_dqlock(dqp);
1238 if (dqp->dq_flags & XFS_DQ_FREEING)
1239 goto out_unlock;
1240 if (!XFS_DQ_IS_DIRTY(dqp))
1241 goto out_unlock;
1242
43ff2122 1243 xfs_dqflock(dqp);
fe7257fd
CH
1244 error = xfs_qm_dqflush(dqp, &bp);
1245 if (error)
1246 goto out_unlock;
b84a3a96 1247
43ff2122 1248 xfs_buf_delwri_queue(bp, buffer_list);
fe7257fd 1249 xfs_buf_relse(bp);
b84a3a96
CH
1250out_unlock:
1251 xfs_dqunlock(dqp);
1252 return error;
1253}
1254
1da177e4
LT
1255/*
1256 * Walk thru all the filesystem inodes and construct a consistent view
1257 * of the disk quota world. If the quotacheck fails, disable quotas.
1258 */
1259int
1260xfs_qm_quotacheck(
1261 xfs_mount_t *mp)
1262{
b84a3a96 1263 int done, count, error, error2;
1da177e4
LT
1264 xfs_ino_t lastino;
1265 size_t structsz;
1266 xfs_inode_t *uip, *gip;
1267 uint flags;
43ff2122 1268 LIST_HEAD (buffer_list);
1da177e4
LT
1269
1270 count = INT_MAX;
1271 structsz = 1;
1272 lastino = 0;
1273 flags = 0;
1274
8a7b8a89 1275 ASSERT(mp->m_quotainfo->qi_uquotaip || mp->m_quotainfo->qi_gquotaip);
1da177e4
LT
1276 ASSERT(XFS_IS_QUOTA_RUNNING(mp));
1277
0b932ccc 1278 xfs_notice(mp, "Quotacheck needed: Please wait.");
1da177e4
LT
1279
1280 /*
c8ad20ff 1281 * First we go thru all the dquots on disk, USR and GRP/PRJ, and reset
1da177e4
LT
1282 * their counters to zero. We need a clean slate.
1283 * We don't log our changes till later.
1284 */
8a7b8a89
CH
1285 uip = mp->m_quotainfo->qi_uquotaip;
1286 if (uip) {
43ff2122
CH
1287 error = xfs_qm_dqiterate(mp, uip, XFS_QMOPT_UQUOTA,
1288 &buffer_list);
8a7b8a89 1289 if (error)
1da177e4
LT
1290 goto error_return;
1291 flags |= XFS_UQUOTA_CHKD;
1292 }
1293
8a7b8a89
CH
1294 gip = mp->m_quotainfo->qi_gquotaip;
1295 if (gip) {
1296 error = xfs_qm_dqiterate(mp, gip, XFS_IS_GQUOTA_ON(mp) ?
43ff2122
CH
1297 XFS_QMOPT_GQUOTA : XFS_QMOPT_PQUOTA,
1298 &buffer_list);
8a7b8a89 1299 if (error)
1da177e4 1300 goto error_return;
c8ad20ff 1301 flags |= XFS_OQUOTA_CHKD;
1da177e4
LT
1302 }
1303
1304 do {
1305 /*
1306 * Iterate thru all the inodes in the file system,
1307 * adjusting the corresponding dquot counters in core.
1308 */
7dce11db
CH
1309 error = xfs_bulkstat(mp, &lastino, &count,
1310 xfs_qm_dqusage_adjust,
1311 structsz, NULL, &done);
1312 if (error)
1da177e4
LT
1313 break;
1314
7dce11db 1315 } while (!done);
1da177e4 1316
4b8879df 1317 /*
b84a3a96
CH
1318 * We've made all the changes that we need to make incore. Flush them
1319 * down to disk buffers if everything was updated successfully.
4b8879df 1320 */
43ff2122
CH
1321 if (XFS_IS_UQUOTA_ON(mp)) {
1322 error = xfs_qm_dquot_walk(mp, XFS_DQ_USER, xfs_qm_flush_one,
1323 &buffer_list);
1324 }
b84a3a96 1325 if (XFS_IS_GQUOTA_ON(mp)) {
43ff2122
CH
1326 error2 = xfs_qm_dquot_walk(mp, XFS_DQ_GROUP, xfs_qm_flush_one,
1327 &buffer_list);
b84a3a96
CH
1328 if (!error)
1329 error = error2;
1330 }
1331 if (XFS_IS_PQUOTA_ON(mp)) {
43ff2122
CH
1332 error2 = xfs_qm_dquot_walk(mp, XFS_DQ_PROJ, xfs_qm_flush_one,
1333 &buffer_list);
b84a3a96
CH
1334 if (!error)
1335 error = error2;
1336 }
4b8879df 1337
43ff2122
CH
1338 error2 = xfs_buf_delwri_submit(&buffer_list);
1339 if (!error)
1340 error = error2;
1341
1da177e4
LT
1342 /*
1343 * We can get this error if we couldn't do a dquot allocation inside
1344 * xfs_qm_dqusage_adjust (via bulkstat). We don't care about the
1345 * dirty dquots that might be cached, we just want to get rid of them
1346 * and turn quotaoff. The dquots won't be attached to any of the inodes
1347 * at this point (because we intentionally didn't in dqget_noattach).
1348 */
1349 if (error) {
8112e9dc 1350 xfs_qm_dqpurge_all(mp, XFS_QMOPT_QUOTALL);
1da177e4
LT
1351 goto error_return;
1352 }
1da177e4 1353
1da177e4
LT
1354 /*
1355 * If one type of quotas is off, then it will lose its
1356 * quotachecked status, since we won't be doing accounting for
1357 * that type anymore.
1358 */
4177af3a 1359 mp->m_qflags &= ~XFS_ALL_QUOTA_CHKD;
1da177e4
LT
1360 mp->m_qflags |= flags;
1361
1da177e4 1362 error_return:
43ff2122
CH
1363 while (!list_empty(&buffer_list)) {
1364 struct xfs_buf *bp =
1365 list_first_entry(&buffer_list, struct xfs_buf, b_list);
1366 list_del_init(&bp->b_list);
1367 xfs_buf_relse(bp);
1368 }
1369
1da177e4 1370 if (error) {
0b932ccc
DC
1371 xfs_warn(mp,
1372 "Quotacheck: Unsuccessful (Error %d): Disabling quotas.",
1373 error);
1da177e4
LT
1374 /*
1375 * We must turn off quotas.
1376 */
1377 ASSERT(mp->m_quotainfo != NULL);
1da177e4 1378 xfs_qm_destroy_quotainfo(mp);
31d5577b 1379 if (xfs_mount_reset_sbqflags(mp)) {
0b932ccc
DC
1380 xfs_warn(mp,
1381 "Quotacheck: Failed to reset quota flags.");
31d5577b 1382 }
0b932ccc
DC
1383 } else
1384 xfs_notice(mp, "Quotacheck: Done.");
1da177e4
LT
1385 return (error);
1386}
1387
1388/*
1389 * This is called after the superblock has been read in and we're ready to
1390 * iget the quota inodes.
1391 */
1392STATIC int
1393xfs_qm_init_quotainos(
1394 xfs_mount_t *mp)
1395{
1396 xfs_inode_t *uip, *gip;
1397 int error;
1398 __int64_t sbflags;
1399 uint flags;
1400
1401 ASSERT(mp->m_quotainfo);
1402 uip = gip = NULL;
1403 sbflags = 0;
1404 flags = 0;
1405
1406 /*
1407 * Get the uquota and gquota inodes
1408 */
62118709 1409 if (xfs_sb_version_hasquota(&mp->m_sb)) {
1da177e4
LT
1410 if (XFS_IS_UQUOTA_ON(mp) &&
1411 mp->m_sb.sb_uquotino != NULLFSINO) {
1412 ASSERT(mp->m_sb.sb_uquotino > 0);
1413 if ((error = xfs_iget(mp, NULL, mp->m_sb.sb_uquotino,
7b6259e7 1414 0, 0, &uip)))
1da177e4
LT
1415 return XFS_ERROR(error);
1416 }
c8ad20ff 1417 if (XFS_IS_OQUOTA_ON(mp) &&
1da177e4
LT
1418 mp->m_sb.sb_gquotino != NULLFSINO) {
1419 ASSERT(mp->m_sb.sb_gquotino > 0);
1420 if ((error = xfs_iget(mp, NULL, mp->m_sb.sb_gquotino,
7b6259e7 1421 0, 0, &gip))) {
1da177e4 1422 if (uip)
43355099 1423 IRELE(uip);
1da177e4
LT
1424 return XFS_ERROR(error);
1425 }
1426 }
1427 } else {
1428 flags |= XFS_QMOPT_SBVERSION;
1429 sbflags |= (XFS_SB_VERSIONNUM | XFS_SB_UQUOTINO |
1430 XFS_SB_GQUOTINO | XFS_SB_QFLAGS);
1431 }
1432
1433 /*
1434 * Create the two inodes, if they don't exist already. The changes
1435 * made above will get added to a transaction and logged in one of
1436 * the qino_alloc calls below. If the device is readonly,
1437 * temporarily switch to read-write to do this.
1438 */
1439 if (XFS_IS_UQUOTA_ON(mp) && uip == NULL) {
1440 if ((error = xfs_qm_qino_alloc(mp, &uip,
1441 sbflags | XFS_SB_UQUOTINO,
1442 flags | XFS_QMOPT_UQUOTA)))
1443 return XFS_ERROR(error);
1444
1445 flags &= ~XFS_QMOPT_SBVERSION;
1446 }
c8ad20ff
NS
1447 if (XFS_IS_OQUOTA_ON(mp) && gip == NULL) {
1448 flags |= (XFS_IS_GQUOTA_ON(mp) ?
1449 XFS_QMOPT_GQUOTA : XFS_QMOPT_PQUOTA);
1450 error = xfs_qm_qino_alloc(mp, &gip,
1451 sbflags | XFS_SB_GQUOTINO, flags);
1452 if (error) {
1da177e4 1453 if (uip)
43355099 1454 IRELE(uip);
1da177e4
LT
1455
1456 return XFS_ERROR(error);
1457 }
1458 }
1459
8a7b8a89
CH
1460 mp->m_quotainfo->qi_uquotaip = uip;
1461 mp->m_quotainfo->qi_gquotaip = gip;
1da177e4 1462
014c2544 1463 return 0;
1da177e4
LT
1464}
1465
92b2e5b3
CH
1466STATIC void
1467xfs_qm_dqfree_one(
1468 struct xfs_dquot *dqp)
1469{
1470 struct xfs_mount *mp = dqp->q_mount;
1471 struct xfs_quotainfo *qi = mp->m_quotainfo;
1da177e4 1472
9f920f11
CH
1473 mutex_lock(&qi->qi_tree_lock);
1474 radix_tree_delete(XFS_DQUOT_TREE(qi, dqp->q_core.d_flags),
1475 be32_to_cpu(dqp->q_core.d_id));
368e1361 1476
92b2e5b3 1477 qi->qi_dquots--;
b84a3a96 1478 mutex_unlock(&qi->qi_tree_lock);
92b2e5b3
CH
1479
1480 xfs_qm_dqdestroy(dqp);
1481}
1482
1483STATIC void
1484xfs_qm_dqreclaim_one(
1485 struct xfs_dquot *dqp,
43ff2122 1486 struct list_head *buffer_list,
92b2e5b3 1487 struct list_head *dispose_list)
1da177e4 1488{
92b2e5b3 1489 struct xfs_mount *mp = dqp->q_mount;
f8739c3c 1490 struct xfs_quotainfo *qi = mp->m_quotainfo;
92b2e5b3 1491 int error;
1da177e4 1492
92b2e5b3 1493 if (!xfs_dqlock_nowait(dqp))
b870553c 1494 goto out_move_tail;
bf72de31 1495
92b2e5b3
CH
1496 /*
1497 * This dquot has acquired a reference in the meantime remove it from
1498 * the freelist and try again.
1499 */
1500 if (dqp->q_nrefs) {
1501 xfs_dqunlock(dqp);
1da177e4 1502
92b2e5b3 1503 trace_xfs_dqreclaim_want(dqp);
48776fd2 1504 XFS_STATS_INC(xs_qm_dqwants);
1da177e4 1505
f8739c3c
CH
1506 list_del_init(&dqp->q_lru);
1507 qi->qi_lru_count--;
48776fd2 1508 XFS_STATS_DEC(xs_qm_dquot_unused);
92b2e5b3
CH
1509 return;
1510 }
368e1361 1511
92b2e5b3
CH
1512 /*
1513 * Try to grab the flush lock. If this dquot is in the process of
1514 * getting flushed to disk, we don't want to reclaim it.
1515 */
1516 if (!xfs_dqflock_nowait(dqp))
b870553c 1517 goto out_unlock_move_tail;
0b1b213f 1518
92b2e5b3 1519 if (XFS_DQ_IS_DIRTY(dqp)) {
fe7257fd
CH
1520 struct xfs_buf *bp = NULL;
1521
92b2e5b3 1522 trace_xfs_dqreclaim_dirty(dqp);
0b1b213f 1523
fe7257fd 1524 error = xfs_qm_dqflush(dqp, &bp);
92b2e5b3
CH
1525 if (error) {
1526 xfs_warn(mp, "%s: dquot %p flush failed",
1527 __func__, dqp);
b870553c 1528 goto out_unlock_move_tail;
1da177e4 1529 }
368e1361 1530
43ff2122 1531 xfs_buf_delwri_queue(bp, buffer_list);
fe7257fd 1532 xfs_buf_relse(bp);
1da177e4 1533 /*
92b2e5b3
CH
1534 * Give the dquot another try on the freelist, as the
1535 * flushing will take some time.
1da177e4 1536 */
b870553c 1537 goto out_unlock_move_tail;
92b2e5b3
CH
1538 }
1539 xfs_dqfunlock(dqp);
92678554 1540
92b2e5b3
CH
1541 /*
1542 * Prevent lookups now that we are past the point of no return.
1543 */
1544 dqp->dq_flags |= XFS_DQ_FREEING;
1545 xfs_dqunlock(dqp);
92678554 1546
92b2e5b3 1547 ASSERT(dqp->q_nrefs == 0);
f8739c3c
CH
1548 list_move_tail(&dqp->q_lru, dispose_list);
1549 qi->qi_lru_count--;
48776fd2 1550 XFS_STATS_DEC(xs_qm_dquot_unused);
92678554 1551
92b2e5b3 1552 trace_xfs_dqreclaim_done(dqp);
48776fd2 1553 XFS_STATS_INC(xs_qm_dqreclaims);
92b2e5b3 1554 return;
1da177e4 1555
92b2e5b3
CH
1556 /*
1557 * Move the dquot to the tail of the list so that we don't spin on it.
1558 */
b870553c
DC
1559out_unlock_move_tail:
1560 xfs_dqunlock(dqp);
1561out_move_tail:
f8739c3c 1562 list_move_tail(&dqp->q_lru, &qi->qi_lru_list);
92b2e5b3 1563 trace_xfs_dqreclaim_busy(dqp);
48776fd2 1564 XFS_STATS_INC(xs_qm_dqreclaim_misses);
368e1361 1565}
1da177e4 1566
1da177e4 1567STATIC int
7f8275d0 1568xfs_qm_shake(
92b2e5b3
CH
1569 struct shrinker *shrink,
1570 struct shrink_control *sc)
1da177e4 1571{
f8739c3c
CH
1572 struct xfs_quotainfo *qi =
1573 container_of(shrink, struct xfs_quotainfo, qi_shrinker);
92b2e5b3 1574 int nr_to_scan = sc->nr_to_scan;
43ff2122 1575 LIST_HEAD (buffer_list);
92b2e5b3
CH
1576 LIST_HEAD (dispose_list);
1577 struct xfs_dquot *dqp;
43ff2122 1578 int error;
1da177e4 1579
92b2e5b3 1580 if ((sc->gfp_mask & (__GFP_FS|__GFP_WAIT)) != (__GFP_FS|__GFP_WAIT))
014c2544 1581 return 0;
92b2e5b3
CH
1582 if (!nr_to_scan)
1583 goto out;
1da177e4 1584
f8739c3c
CH
1585 mutex_lock(&qi->qi_lru_lock);
1586 while (!list_empty(&qi->qi_lru_list)) {
92b2e5b3
CH
1587 if (nr_to_scan-- <= 0)
1588 break;
f8739c3c
CH
1589 dqp = list_first_entry(&qi->qi_lru_list, struct xfs_dquot,
1590 q_lru);
43ff2122 1591 xfs_qm_dqreclaim_one(dqp, &buffer_list, &dispose_list);
1da177e4 1592 }
f8739c3c 1593 mutex_unlock(&qi->qi_lru_lock);
1da177e4 1594
43ff2122
CH
1595 error = xfs_buf_delwri_submit(&buffer_list);
1596 if (error)
1597 xfs_warn(NULL, "%s: dquot reclaim failed", __func__);
1598
92b2e5b3 1599 while (!list_empty(&dispose_list)) {
f8739c3c
CH
1600 dqp = list_first_entry(&dispose_list, struct xfs_dquot, q_lru);
1601 list_del_init(&dqp->q_lru);
92b2e5b3
CH
1602 xfs_qm_dqfree_one(dqp);
1603 }
43ff2122 1604
92b2e5b3 1605out:
f8739c3c 1606 return (qi->qi_lru_count / 100) * sysctl_vfs_cache_pressure;
1da177e4
LT
1607}
1608
1da177e4
LT
1609/*
1610 * Start a transaction and write the incore superblock changes to
1611 * disk. flags parameter indicates which fields have changed.
1612 */
1613int
1614xfs_qm_write_sb_changes(
1615 xfs_mount_t *mp,
1616 __int64_t flags)
1617{
1618 xfs_trans_t *tp;
1619 int error;
1620
1da177e4 1621 tp = xfs_trans_alloc(mp, XFS_TRANS_QM_SBCHANGE);
f910a8c6
JL
1622 error = xfs_trans_reserve(tp, 0, XFS_QM_SBCHANGE_LOG_RES(mp),
1623 0, 0, XFS_DEFAULT_LOG_COUNT);
1624 if (error) {
1da177e4 1625 xfs_trans_cancel(tp, 0);
014c2544 1626 return error;
1da177e4
LT
1627 }
1628
1629 xfs_mod_sb(tp, flags);
e5720eec 1630 error = xfs_trans_commit(tp, 0);
1da177e4 1631
e5720eec 1632 return error;
1da177e4
LT
1633}
1634
1635
1636/* --------------- utility functions for vnodeops ---------------- */
1637
1638
1639/*
6c77b0ea 1640 * Given an inode, a uid, gid and prid make sure that we have
1da177e4
LT
1641 * allocated relevant dquot(s) on disk, and that we won't exceed inode
1642 * quotas by creating this file.
1643 * This also attaches dquot(s) to the given inode after locking it,
1644 * and returns the dquots corresponding to the uid and/or gid.
1645 *
1646 * in : inode (unlocked)
1647 * out : udquot, gdquot with references taken and unlocked
1648 */
1649int
1650xfs_qm_vop_dqalloc(
7d095257
CH
1651 struct xfs_inode *ip,
1652 uid_t uid,
1653 gid_t gid,
1654 prid_t prid,
1655 uint flags,
1656 struct xfs_dquot **O_udqpp,
1657 struct xfs_dquot **O_gdqpp)
1da177e4 1658{
7d095257
CH
1659 struct xfs_mount *mp = ip->i_mount;
1660 struct xfs_dquot *uq, *gq;
1661 int error;
1662 uint lockflags;
1da177e4 1663
7d095257 1664 if (!XFS_IS_QUOTA_RUNNING(mp) || !XFS_IS_QUOTA_ON(mp))
1da177e4
LT
1665 return 0;
1666
1667 lockflags = XFS_ILOCK_EXCL;
1668 xfs_ilock(ip, lockflags);
1669
bd186aa9 1670 if ((flags & XFS_QMOPT_INHERIT) && XFS_INHERIT_GID(ip))
1da177e4
LT
1671 gid = ip->i_d.di_gid;
1672
1673 /*
1674 * Attach the dquot(s) to this inode, doing a dquot allocation
1675 * if necessary. The dquot(s) will not be locked.
1676 */
1677 if (XFS_NOT_DQATTACHED(mp, ip)) {
7d095257
CH
1678 error = xfs_qm_dqattach_locked(ip, XFS_QMOPT_DQALLOC);
1679 if (error) {
1da177e4 1680 xfs_iunlock(ip, lockflags);
014c2544 1681 return error;
1da177e4
LT
1682 }
1683 }
1684
1685 uq = gq = NULL;
c8ad20ff 1686 if ((flags & XFS_QMOPT_UQUOTA) && XFS_IS_UQUOTA_ON(mp)) {
1da177e4
LT
1687 if (ip->i_d.di_uid != uid) {
1688 /*
1689 * What we need is the dquot that has this uid, and
1690 * if we send the inode to dqget, the uid of the inode
1691 * takes priority over what's sent in the uid argument.
1692 * We must unlock inode here before calling dqget if
1693 * we're not sending the inode, because otherwise
1694 * we'll deadlock by doing trans_reserve while
1695 * holding ilock.
1696 */
1697 xfs_iunlock(ip, lockflags);
1698 if ((error = xfs_qm_dqget(mp, NULL, (xfs_dqid_t) uid,
1699 XFS_DQ_USER,
1700 XFS_QMOPT_DQALLOC |
1701 XFS_QMOPT_DOWARN,
1702 &uq))) {
1703 ASSERT(error != ENOENT);
014c2544 1704 return error;
1da177e4
LT
1705 }
1706 /*
1707 * Get the ilock in the right order.
1708 */
1709 xfs_dqunlock(uq);
1710 lockflags = XFS_ILOCK_SHARED;
1711 xfs_ilock(ip, lockflags);
1712 } else {
1713 /*
1714 * Take an extra reference, because we'll return
1715 * this to caller
1716 */
1717 ASSERT(ip->i_udquot);
78e55892 1718 uq = xfs_qm_dqhold(ip->i_udquot);
1da177e4
LT
1719 }
1720 }
c8ad20ff 1721 if ((flags & XFS_QMOPT_GQUOTA) && XFS_IS_GQUOTA_ON(mp)) {
1da177e4
LT
1722 if (ip->i_d.di_gid != gid) {
1723 xfs_iunlock(ip, lockflags);
1724 if ((error = xfs_qm_dqget(mp, NULL, (xfs_dqid_t)gid,
1725 XFS_DQ_GROUP,
1726 XFS_QMOPT_DQALLOC |
1727 XFS_QMOPT_DOWARN,
1728 &gq))) {
1729 if (uq)
1730 xfs_qm_dqrele(uq);
1731 ASSERT(error != ENOENT);
014c2544 1732 return error;
1da177e4
LT
1733 }
1734 xfs_dqunlock(gq);
1735 lockflags = XFS_ILOCK_SHARED;
1736 xfs_ilock(ip, lockflags);
1737 } else {
1738 ASSERT(ip->i_gdquot);
78e55892 1739 gq = xfs_qm_dqhold(ip->i_gdquot);
1da177e4 1740 }
c8ad20ff 1741 } else if ((flags & XFS_QMOPT_PQUOTA) && XFS_IS_PQUOTA_ON(mp)) {
6743099c 1742 if (xfs_get_projid(ip) != prid) {
c8ad20ff
NS
1743 xfs_iunlock(ip, lockflags);
1744 if ((error = xfs_qm_dqget(mp, NULL, (xfs_dqid_t)prid,
1745 XFS_DQ_PROJ,
1746 XFS_QMOPT_DQALLOC |
1747 XFS_QMOPT_DOWARN,
1748 &gq))) {
1749 if (uq)
1750 xfs_qm_dqrele(uq);
1751 ASSERT(error != ENOENT);
1752 return (error);
1753 }
1754 xfs_dqunlock(gq);
1755 lockflags = XFS_ILOCK_SHARED;
1756 xfs_ilock(ip, lockflags);
1757 } else {
1758 ASSERT(ip->i_gdquot);
78e55892 1759 gq = xfs_qm_dqhold(ip->i_gdquot);
c8ad20ff 1760 }
1da177e4
LT
1761 }
1762 if (uq)
0b1b213f 1763 trace_xfs_dquot_dqalloc(ip);
1da177e4
LT
1764
1765 xfs_iunlock(ip, lockflags);
1766 if (O_udqpp)
1767 *O_udqpp = uq;
1768 else if (uq)
1769 xfs_qm_dqrele(uq);
1770 if (O_gdqpp)
1771 *O_gdqpp = gq;
1772 else if (gq)
1773 xfs_qm_dqrele(gq);
014c2544 1774 return 0;
1da177e4
LT
1775}
1776
1777/*
1778 * Actually transfer ownership, and do dquot modifications.
1779 * These were already reserved.
1780 */
1781xfs_dquot_t *
1782xfs_qm_vop_chown(
1783 xfs_trans_t *tp,
1784 xfs_inode_t *ip,
1785 xfs_dquot_t **IO_olddq,
1786 xfs_dquot_t *newdq)
1787{
1788 xfs_dquot_t *prevdq;
06d10dd9
NS
1789 uint bfield = XFS_IS_REALTIME_INODE(ip) ?
1790 XFS_TRANS_DQ_RTBCOUNT : XFS_TRANS_DQ_BCOUNT;
1791
7d095257 1792
579aa9ca 1793 ASSERT(xfs_isilocked(ip, XFS_ILOCK_EXCL));
1da177e4
LT
1794 ASSERT(XFS_IS_QUOTA_RUNNING(ip->i_mount));
1795
1796 /* old dquot */
1797 prevdq = *IO_olddq;
1798 ASSERT(prevdq);
1799 ASSERT(prevdq != newdq);
1800
06d10dd9
NS
1801 xfs_trans_mod_dquot(tp, prevdq, bfield, -(ip->i_d.di_nblocks));
1802 xfs_trans_mod_dquot(tp, prevdq, XFS_TRANS_DQ_ICOUNT, -1);
1da177e4
LT
1803
1804 /* the sparkling new dquot */
06d10dd9
NS
1805 xfs_trans_mod_dquot(tp, newdq, bfield, ip->i_d.di_nblocks);
1806 xfs_trans_mod_dquot(tp, newdq, XFS_TRANS_DQ_ICOUNT, 1);
1da177e4
LT
1807
1808 /*
78e55892
CH
1809 * Take an extra reference, because the inode is going to keep
1810 * this dquot pointer even after the trans_commit.
1da177e4 1811 */
78e55892 1812 *IO_olddq = xfs_qm_dqhold(newdq);
1da177e4 1813
014c2544 1814 return prevdq;
1da177e4
LT
1815}
1816
1817/*
c8ad20ff 1818 * Quota reservations for setattr(AT_UID|AT_GID|AT_PROJID).
1da177e4
LT
1819 */
1820int
1821xfs_qm_vop_chown_reserve(
1822 xfs_trans_t *tp,
1823 xfs_inode_t *ip,
1824 xfs_dquot_t *udqp,
1825 xfs_dquot_t *gdqp,
1826 uint flags)
1827{
7d095257 1828 xfs_mount_t *mp = ip->i_mount;
9a2a7de2 1829 uint delblks, blkflags, prjflags = 0;
1da177e4 1830 xfs_dquot_t *unresudq, *unresgdq, *delblksudq, *delblksgdq;
7d095257
CH
1831 int error;
1832
1da177e4 1833
579aa9ca 1834 ASSERT(xfs_isilocked(ip, XFS_ILOCK_EXCL|XFS_ILOCK_SHARED));
1da177e4
LT
1835 ASSERT(XFS_IS_QUOTA_RUNNING(mp));
1836
1837 delblks = ip->i_delayed_blks;
1838 delblksudq = delblksgdq = unresudq = unresgdq = NULL;
06d10dd9
NS
1839 blkflags = XFS_IS_REALTIME_INODE(ip) ?
1840 XFS_QMOPT_RES_RTBLKS : XFS_QMOPT_RES_REGBLKS;
1da177e4
LT
1841
1842 if (XFS_IS_UQUOTA_ON(mp) && udqp &&
1149d96a 1843 ip->i_d.di_uid != (uid_t)be32_to_cpu(udqp->q_core.d_id)) {
1da177e4
LT
1844 delblksudq = udqp;
1845 /*
1846 * If there are delayed allocation blocks, then we have to
1847 * unreserve those from the old dquot, and add them to the
1848 * new dquot.
1849 */
1850 if (delblks) {
1851 ASSERT(ip->i_udquot);
1852 unresudq = ip->i_udquot;
1853 }
1854 }
c8ad20ff 1855 if (XFS_IS_OQUOTA_ON(ip->i_mount) && gdqp) {
9a2a7de2 1856 if (XFS_IS_PQUOTA_ON(ip->i_mount) &&
6743099c 1857 xfs_get_projid(ip) != be32_to_cpu(gdqp->q_core.d_id))
9a2a7de2
NS
1858 prjflags = XFS_QMOPT_ENOSPC;
1859
1860 if (prjflags ||
1861 (XFS_IS_GQUOTA_ON(ip->i_mount) &&
1862 ip->i_d.di_gid != be32_to_cpu(gdqp->q_core.d_id))) {
c8ad20ff
NS
1863 delblksgdq = gdqp;
1864 if (delblks) {
1865 ASSERT(ip->i_gdquot);
1866 unresgdq = ip->i_gdquot;
1867 }
1da177e4
LT
1868 }
1869 }
1870
1871 if ((error = xfs_trans_reserve_quota_bydquots(tp, ip->i_mount,
1872 delblksudq, delblksgdq, ip->i_d.di_nblocks, 1,
9a2a7de2 1873 flags | blkflags | prjflags)))
1da177e4
LT
1874 return (error);
1875
1876 /*
1877 * Do the delayed blks reservations/unreservations now. Since, these
1878 * are done without the help of a transaction, if a reservation fails
1879 * its previous reservations won't be automatically undone by trans
1880 * code. So, we have to do it manually here.
1881 */
1882 if (delblks) {
1883 /*
1884 * Do the reservations first. Unreservation can't fail.
1885 */
1886 ASSERT(delblksudq || delblksgdq);
1887 ASSERT(unresudq || unresgdq);
1888 if ((error = xfs_trans_reserve_quota_bydquots(NULL, ip->i_mount,
1889 delblksudq, delblksgdq, (xfs_qcnt_t)delblks, 0,
9a2a7de2 1890 flags | blkflags | prjflags)))
1da177e4
LT
1891 return (error);
1892 xfs_trans_reserve_quota_bydquots(NULL, ip->i_mount,
1893 unresudq, unresgdq, -((xfs_qcnt_t)delblks), 0,
06d10dd9 1894 blkflags);
1da177e4
LT
1895 }
1896
1897 return (0);
1898}
1899
1900int
1901xfs_qm_vop_rename_dqattach(
7d095257 1902 struct xfs_inode **i_tab)
1da177e4 1903{
7d095257
CH
1904 struct xfs_mount *mp = i_tab[0]->i_mount;
1905 int i;
1da177e4 1906
7d095257 1907 if (!XFS_IS_QUOTA_RUNNING(mp) || !XFS_IS_QUOTA_ON(mp))
014c2544 1908 return 0;
1da177e4 1909
7d095257
CH
1910 for (i = 0; (i < 4 && i_tab[i]); i++) {
1911 struct xfs_inode *ip = i_tab[i];
1912 int error;
1913
1da177e4
LT
1914 /*
1915 * Watch out for duplicate entries in the table.
1916 */
7d095257
CH
1917 if (i == 0 || ip != i_tab[i-1]) {
1918 if (XFS_NOT_DQATTACHED(mp, ip)) {
1da177e4
LT
1919 error = xfs_qm_dqattach(ip, 0);
1920 if (error)
014c2544 1921 return error;
1da177e4
LT
1922 }
1923 }
1924 }
014c2544 1925 return 0;
1da177e4
LT
1926}
1927
1928void
7d095257
CH
1929xfs_qm_vop_create_dqattach(
1930 struct xfs_trans *tp,
1931 struct xfs_inode *ip,
1932 struct xfs_dquot *udqp,
1933 struct xfs_dquot *gdqp)
1da177e4 1934{
7d095257
CH
1935 struct xfs_mount *mp = tp->t_mountp;
1936
1937 if (!XFS_IS_QUOTA_RUNNING(mp) || !XFS_IS_QUOTA_ON(mp))
1da177e4
LT
1938 return;
1939
579aa9ca 1940 ASSERT(xfs_isilocked(ip, XFS_ILOCK_EXCL));
7d095257 1941 ASSERT(XFS_IS_QUOTA_RUNNING(mp));
1da177e4
LT
1942
1943 if (udqp) {
1da177e4 1944 ASSERT(ip->i_udquot == NULL);
7d095257 1945 ASSERT(XFS_IS_UQUOTA_ON(mp));
1149d96a 1946 ASSERT(ip->i_d.di_uid == be32_to_cpu(udqp->q_core.d_id));
78e55892
CH
1947
1948 ip->i_udquot = xfs_qm_dqhold(udqp);
1da177e4
LT
1949 xfs_trans_mod_dquot(tp, udqp, XFS_TRANS_DQ_ICOUNT, 1);
1950 }
1951 if (gdqp) {
1da177e4 1952 ASSERT(ip->i_gdquot == NULL);
7d095257
CH
1953 ASSERT(XFS_IS_OQUOTA_ON(mp));
1954 ASSERT((XFS_IS_GQUOTA_ON(mp) ?
6743099c 1955 ip->i_d.di_gid : xfs_get_projid(ip)) ==
ee2a4f7c 1956 be32_to_cpu(gdqp->q_core.d_id));
78e55892
CH
1957
1958 ip->i_gdquot = xfs_qm_dqhold(gdqp);
1da177e4
LT
1959 xfs_trans_mod_dquot(tp, gdqp, XFS_TRANS_DQ_ICOUNT, 1);
1960 }
1961}
1962