]> git.proxmox.com Git - mirror_ubuntu-artful-kernel.git/blame - fs/xfs/xfs_qm.c
xfs: fix dquot isolation hang
[mirror_ubuntu-artful-kernel.git] / fs / xfs / xfs_qm.c
CommitLineData
1da177e4 1/*
4ce3121f
NS
2 * Copyright (c) 2000-2005 Silicon Graphics, Inc.
3 * All Rights Reserved.
1da177e4 4 *
4ce3121f
NS
5 * This program is free software; you can redistribute it and/or
6 * modify it under the terms of the GNU General Public License as
1da177e4
LT
7 * published by the Free Software Foundation.
8 *
4ce3121f
NS
9 * This program is distributed in the hope that it would be useful,
10 * but WITHOUT ANY WARRANTY; without even the implied warranty of
11 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
12 * GNU General Public License for more details.
1da177e4 13 *
4ce3121f
NS
14 * You should have received a copy of the GNU General Public License
15 * along with this program; if not, write the Free Software Foundation,
16 * Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA
1da177e4 17 */
1da177e4
LT
18#include "xfs.h"
19#include "xfs_fs.h"
6ca1c906 20#include "xfs_format.h"
a844f451 21#include "xfs_bit.h"
1da177e4 22#include "xfs_log.h"
1da177e4
LT
23#include "xfs_trans.h"
24#include "xfs_sb.h"
25#include "xfs_ag.h"
1da177e4 26#include "xfs_alloc.h"
1da177e4
LT
27#include "xfs_quota.h"
28#include "xfs_mount.h"
1da177e4
LT
29#include "xfs_bmap_btree.h"
30#include "xfs_ialloc_btree.h"
1da177e4
LT
31#include "xfs_dinode.h"
32#include "xfs_inode.h"
a844f451
NS
33#include "xfs_ialloc.h"
34#include "xfs_itable.h"
1da177e4
LT
35#include "xfs_rtalloc.h"
36#include "xfs_error.h"
a844f451 37#include "xfs_bmap.h"
1da177e4
LT
38#include "xfs_attr.h"
39#include "xfs_buf_item.h"
40#include "xfs_trans_space.h"
1da177e4 41#include "xfs_qm.h"
0b1b213f 42#include "xfs_trace.h"
33479e05 43#include "xfs_icache.h"
6fcdc59d 44#include "xfs_cksum.h"
1da177e4
LT
45
46/*
47 * The global quota manager. There is only one of these for the entire
48 * system, _not_ one per file system. XQM keeps track of the overall
49 * quota functionality, including maintaining the freelist and hash
50 * tables of dquots.
51 */
1da177e4 52STATIC int xfs_qm_init_quotainos(xfs_mount_t *);
ba0f32d4 53STATIC int xfs_qm_init_quotainfo(xfs_mount_t *);
1da177e4 54
cd56a39a
DC
55
56STATIC void xfs_qm_dqfree_one(struct xfs_dquot *dqp);
b84a3a96
CH
57/*
58 * We use the batch lookup interface to iterate over the dquots as it
59 * currently is the only interface into the radix tree code that allows
60 * fuzzy lookups instead of exact matches. Holding the lock over multiple
61 * operations is fine as all callers are used either during mount/umount
62 * or quotaoff.
63 */
64#define XFS_DQ_LOOKUP_BATCH 32
65
66STATIC int
67xfs_qm_dquot_walk(
68 struct xfs_mount *mp,
69 int type,
43ff2122
CH
70 int (*execute)(struct xfs_dquot *dqp, void *data),
71 void *data)
b84a3a96
CH
72{
73 struct xfs_quotainfo *qi = mp->m_quotainfo;
329e0875 74 struct radix_tree_root *tree = xfs_dquot_tree(qi, type);
b84a3a96
CH
75 uint32_t next_index;
76 int last_error = 0;
77 int skipped;
78 int nr_found;
79
80restart:
81 skipped = 0;
82 next_index = 0;
83 nr_found = 0;
84
85 while (1) {
86 struct xfs_dquot *batch[XFS_DQ_LOOKUP_BATCH];
87 int error = 0;
88 int i;
89
90 mutex_lock(&qi->qi_tree_lock);
91 nr_found = radix_tree_gang_lookup(tree, (void **)batch,
92 next_index, XFS_DQ_LOOKUP_BATCH);
93 if (!nr_found) {
94 mutex_unlock(&qi->qi_tree_lock);
95 break;
96 }
97
98 for (i = 0; i < nr_found; i++) {
99 struct xfs_dquot *dqp = batch[i];
100
101 next_index = be32_to_cpu(dqp->q_core.d_id) + 1;
102
43ff2122 103 error = execute(batch[i], data);
b84a3a96
CH
104 if (error == EAGAIN) {
105 skipped++;
106 continue;
107 }
108 if (error && last_error != EFSCORRUPTED)
109 last_error = error;
110 }
111
112 mutex_unlock(&qi->qi_tree_lock);
113
114 /* bail out if the filesystem is corrupted. */
115 if (last_error == EFSCORRUPTED) {
116 skipped = 0;
117 break;
118 }
119 }
120
121 if (skipped) {
122 delay(1);
123 goto restart;
124 }
125
126 return last_error;
127}
128
129
130/*
131 * Purge a dquot from all tracking data structures and free it.
132 */
133STATIC int
134xfs_qm_dqpurge(
43ff2122
CH
135 struct xfs_dquot *dqp,
136 void *data)
b84a3a96
CH
137{
138 struct xfs_mount *mp = dqp->q_mount;
139 struct xfs_quotainfo *qi = mp->m_quotainfo;
140 struct xfs_dquot *gdqp = NULL;
92f8ff73 141 struct xfs_dquot *pdqp = NULL;
b84a3a96
CH
142
143 xfs_dqlock(dqp);
144 if ((dqp->dq_flags & XFS_DQ_FREEING) || dqp->q_nrefs != 0) {
145 xfs_dqunlock(dqp);
146 return EAGAIN;
147 }
148
149 /*
92f8ff73 150 * If this quota has a hint attached, prepare for releasing it now.
b84a3a96
CH
151 */
152 gdqp = dqp->q_gdquot;
153 if (gdqp) {
154 xfs_dqlock(gdqp);
155 dqp->q_gdquot = NULL;
156 }
157
92f8ff73
CS
158 pdqp = dqp->q_pdquot;
159 if (pdqp) {
160 xfs_dqlock(pdqp);
161 dqp->q_pdquot = NULL;
162 }
163
b84a3a96
CH
164 dqp->dq_flags |= XFS_DQ_FREEING;
165
43ff2122 166 xfs_dqflock(dqp);
b84a3a96
CH
167
168 /*
169 * If we are turning this type of quotas off, we don't care
170 * about the dirty metadata sitting in this dquot. OTOH, if
171 * we're unmounting, we do care, so we flush it and wait.
172 */
173 if (XFS_DQ_IS_DIRTY(dqp)) {
fe7257fd
CH
174 struct xfs_buf *bp = NULL;
175 int error;
b84a3a96
CH
176
177 /*
178 * We don't care about getting disk errors here. We need
179 * to purge this dquot anyway, so we go ahead regardless.
180 */
fe7257fd
CH
181 error = xfs_qm_dqflush(dqp, &bp);
182 if (error) {
b84a3a96
CH
183 xfs_warn(mp, "%s: dquot %p flush failed",
184 __func__, dqp);
fe7257fd
CH
185 } else {
186 error = xfs_bwrite(bp);
187 xfs_buf_relse(bp);
188 }
b84a3a96
CH
189 xfs_dqflock(dqp);
190 }
191
192 ASSERT(atomic_read(&dqp->q_pincount) == 0);
193 ASSERT(XFS_FORCED_SHUTDOWN(mp) ||
194 !(dqp->q_logitem.qli_item.li_flags & XFS_LI_IN_AIL));
195
196 xfs_dqfunlock(dqp);
197 xfs_dqunlock(dqp);
198
329e0875 199 radix_tree_delete(xfs_dquot_tree(qi, dqp->q_core.d_flags),
b84a3a96
CH
200 be32_to_cpu(dqp->q_core.d_id));
201 qi->qi_dquots--;
202
203 /*
204 * We move dquots to the freelist as soon as their reference count
205 * hits zero, so it really should be on the freelist here.
206 */
b84a3a96 207 ASSERT(!list_empty(&dqp->q_lru));
cd56a39a 208 list_lru_del(&qi->qi_lru, &dqp->q_lru);
b84a3a96 209 XFS_STATS_DEC(xs_qm_dquot_unused);
b84a3a96
CH
210
211 xfs_qm_dqdestroy(dqp);
212
213 if (gdqp)
214 xfs_qm_dqput(gdqp);
92f8ff73
CS
215 if (pdqp)
216 xfs_qm_dqput(pdqp);
b84a3a96
CH
217 return 0;
218}
219
220/*
221 * Purge the dquot cache.
222 */
223void
224xfs_qm_dqpurge_all(
225 struct xfs_mount *mp,
226 uint flags)
227{
228 if (flags & XFS_QMOPT_UQUOTA)
43ff2122 229 xfs_qm_dquot_walk(mp, XFS_DQ_USER, xfs_qm_dqpurge, NULL);
b84a3a96 230 if (flags & XFS_QMOPT_GQUOTA)
43ff2122 231 xfs_qm_dquot_walk(mp, XFS_DQ_GROUP, xfs_qm_dqpurge, NULL);
b84a3a96 232 if (flags & XFS_QMOPT_PQUOTA)
43ff2122 233 xfs_qm_dquot_walk(mp, XFS_DQ_PROJ, xfs_qm_dqpurge, NULL);
b84a3a96
CH
234}
235
1da177e4
LT
236/*
237 * Just destroy the quotainfo structure.
238 */
239void
7d095257
CH
240xfs_qm_unmount(
241 struct xfs_mount *mp)
1da177e4 242{
7d095257 243 if (mp->m_quotainfo) {
8112e9dc 244 xfs_qm_dqpurge_all(mp, XFS_QMOPT_QUOTALL);
1da177e4 245 xfs_qm_destroy_quotainfo(mp);
7d095257 246 }
1da177e4
LT
247}
248
249
250/*
251 * This is called from xfs_mountfs to start quotas and initialize all
252 * necessary data structures like quotainfo. This is also responsible for
253 * running a quotacheck as necessary. We are guaranteed that the superblock
254 * is consistently read in at this point.
53aa7915
DC
255 *
256 * If we fail here, the mount will continue with quota turned off. We don't
257 * need to inidicate success or failure at all.
1da177e4 258 */
53aa7915 259void
1da177e4 260xfs_qm_mount_quotas(
4249023a 261 xfs_mount_t *mp)
1da177e4 262{
1da177e4
LT
263 int error = 0;
264 uint sbf;
265
1da177e4
LT
266 /*
267 * If quotas on realtime volumes is not supported, we disable
268 * quotas immediately.
269 */
270 if (mp->m_sb.sb_rextents) {
0b932ccc 271 xfs_notice(mp, "Cannot turn on quotas for realtime filesystem");
1da177e4
LT
272 mp->m_qflags = 0;
273 goto write_changes;
274 }
275
1da177e4 276 ASSERT(XFS_IS_QUOTA_RUNNING(mp));
155ffd07 277
1da177e4
LT
278 /*
279 * Allocate the quotainfo structure inside the mount struct, and
280 * create quotainode(s), and change/rev superblock if necessary.
281 */
53aa7915
DC
282 error = xfs_qm_init_quotainfo(mp);
283 if (error) {
1da177e4
LT
284 /*
285 * We must turn off quotas.
286 */
287 ASSERT(mp->m_quotainfo == NULL);
288 mp->m_qflags = 0;
289 goto write_changes;
290 }
291 /*
292 * If any of the quotas are not consistent, do a quotacheck.
293 */
4249023a 294 if (XFS_QM_NEED_QUOTACHECK(mp)) {
53aa7915
DC
295 error = xfs_qm_quotacheck(mp);
296 if (error) {
297 /* Quotacheck failed and disabled quotas. */
298 return;
1da177e4 299 }
1da177e4 300 }
646d5bda
DD
301 /*
302 * If one type of quotas is off, then it will lose its
303 * quotachecked status, since we won't be doing accounting for
304 * that type anymore.
305 */
53aa7915 306 if (!XFS_IS_UQUOTA_ON(mp))
646d5bda 307 mp->m_qflags &= ~XFS_UQUOTA_CHKD;
83e782e1
CS
308 if (!XFS_IS_GQUOTA_ON(mp))
309 mp->m_qflags &= ~XFS_GQUOTA_CHKD;
310 if (!XFS_IS_PQUOTA_ON(mp))
311 mp->m_qflags &= ~XFS_PQUOTA_CHKD;
155ffd07 312
1da177e4
LT
313 write_changes:
314 /*
3685c2a1 315 * We actually don't have to acquire the m_sb_lock at all.
1da177e4
LT
316 * This can only be called from mount, and that's single threaded. XXX
317 */
3685c2a1 318 spin_lock(&mp->m_sb_lock);
1da177e4
LT
319 sbf = mp->m_sb.sb_qflags;
320 mp->m_sb.sb_qflags = mp->m_qflags & XFS_MOUNT_QUOTA_ALL;
3685c2a1 321 spin_unlock(&mp->m_sb_lock);
1da177e4
LT
322
323 if (sbf != (mp->m_qflags & XFS_MOUNT_QUOTA_ALL)) {
324 if (xfs_qm_write_sb_changes(mp, XFS_SB_QFLAGS)) {
325 /*
326 * We could only have been turning quotas off.
327 * We aren't in very good shape actually because
328 * the incore structures are convinced that quotas are
329 * off, but the on disk superblock doesn't know that !
330 */
331 ASSERT(!(XFS_IS_QUOTA_RUNNING(mp)));
53487786
DC
332 xfs_alert(mp, "%s: Superblock update failed!",
333 __func__);
1da177e4
LT
334 }
335 }
336
337 if (error) {
53487786 338 xfs_warn(mp, "Failed to initialize disk quotas.");
7d095257 339 return;
1da177e4 340 }
1da177e4
LT
341}
342
343/*
344 * Called from the vfsops layer.
345 */
e57481dc 346void
1da177e4
LT
347xfs_qm_unmount_quotas(
348 xfs_mount_t *mp)
349{
1da177e4
LT
350 /*
351 * Release the dquots that root inode, et al might be holding,
352 * before we flush quotas and blow away the quotainfo structure.
353 */
354 ASSERT(mp->m_rootip);
355 xfs_qm_dqdetach(mp->m_rootip);
356 if (mp->m_rbmip)
357 xfs_qm_dqdetach(mp->m_rbmip);
358 if (mp->m_rsumip)
359 xfs_qm_dqdetach(mp->m_rsumip);
360
361 /*
e57481dc 362 * Release the quota inodes.
1da177e4 363 */
1da177e4 364 if (mp->m_quotainfo) {
e57481dc
CH
365 if (mp->m_quotainfo->qi_uquotaip) {
366 IRELE(mp->m_quotainfo->qi_uquotaip);
367 mp->m_quotainfo->qi_uquotaip = NULL;
1da177e4 368 }
e57481dc
CH
369 if (mp->m_quotainfo->qi_gquotaip) {
370 IRELE(mp->m_quotainfo->qi_gquotaip);
371 mp->m_quotainfo->qi_gquotaip = NULL;
1da177e4 372 }
92f8ff73
CS
373 if (mp->m_quotainfo->qi_pquotaip) {
374 IRELE(mp->m_quotainfo->qi_pquotaip);
375 mp->m_quotainfo->qi_pquotaip = NULL;
376 }
1da177e4 377 }
1da177e4
LT
378}
379
1da177e4
LT
380STATIC int
381xfs_qm_dqattach_one(
382 xfs_inode_t *ip,
383 xfs_dqid_t id,
384 uint type,
385 uint doalloc,
1da177e4
LT
386 xfs_dquot_t *udqhint, /* hint */
387 xfs_dquot_t **IO_idqpp)
388{
389 xfs_dquot_t *dqp;
390 int error;
391
579aa9ca 392 ASSERT(xfs_isilocked(ip, XFS_ILOCK_EXCL));
1da177e4 393 error = 0;
8e9b6e7f 394
1da177e4
LT
395 /*
396 * See if we already have it in the inode itself. IO_idqpp is
397 * &i_udquot or &i_gdquot. This made the code look weird, but
398 * made the logic a lot simpler.
399 */
8e9b6e7f
CH
400 dqp = *IO_idqpp;
401 if (dqp) {
0b1b213f 402 trace_xfs_dqattach_found(dqp);
8e9b6e7f 403 return 0;
1da177e4
LT
404 }
405
406 /*
407 * udqhint is the i_udquot field in inode, and is non-NULL only
c8ad20ff 408 * when the type arg is group/project. Its purpose is to save a
1da177e4
LT
409 * lookup by dqid (xfs_qm_dqget) by caching a group dquot inside
410 * the user dquot.
411 */
8e9b6e7f
CH
412 if (udqhint) {
413 ASSERT(type == XFS_DQ_GROUP || type == XFS_DQ_PROJ);
1da177e4
LT
414 xfs_dqlock(udqhint);
415
8e9b6e7f
CH
416 /*
417 * No need to take dqlock to look at the id.
418 *
419 * The ID can't change until it gets reclaimed, and it won't
420 * be reclaimed as long as we have a ref from inode and we
421 * hold the ilock.
422 */
92f8ff73
CS
423 if (type == XFS_DQ_GROUP)
424 dqp = udqhint->q_gdquot;
425 else
426 dqp = udqhint->q_pdquot;
8e9b6e7f 427 if (dqp && be32_to_cpu(dqp->q_core.d_id) == id) {
8e9b6e7f 428 ASSERT(*IO_idqpp == NULL);
8e9b6e7f 429
78e55892 430 *IO_idqpp = xfs_qm_dqhold(dqp);
1da177e4 431 xfs_dqunlock(udqhint);
8e9b6e7f 432 return 0;
1da177e4 433 }
8e9b6e7f
CH
434
435 /*
436 * We can't hold a dquot lock when we call the dqget code.
437 * We'll deadlock in no time, because of (not conforming to)
438 * lock ordering - the inodelock comes before any dquot lock,
439 * and we may drop and reacquire the ilock in xfs_qm_dqget().
440 */
1da177e4 441 xfs_dqunlock(udqhint);
8e9b6e7f
CH
442 }
443
1da177e4
LT
444 /*
445 * Find the dquot from somewhere. This bumps the
446 * reference count of dquot and returns it locked.
447 * This can return ENOENT if dquot didn't exist on
448 * disk and we didn't ask it to allocate;
449 * ESRCH if quotas got turned off suddenly.
450 */
db3e74b5
MH
451 error = xfs_qm_dqget(ip->i_mount, ip, id, type,
452 doalloc | XFS_QMOPT_DOWARN, &dqp);
8e9b6e7f
CH
453 if (error)
454 return error;
1da177e4 455
0b1b213f 456 trace_xfs_dqattach_get(dqp);
8e9b6e7f 457
1da177e4
LT
458 /*
459 * dqget may have dropped and re-acquired the ilock, but it guarantees
460 * that the dquot returned is the one that should go in the inode.
461 */
462 *IO_idqpp = dqp;
8e9b6e7f
CH
463 xfs_dqunlock(dqp);
464 return 0;
1da177e4
LT
465}
466
467
468/*
92f8ff73
CS
469 * Given a udquot and group/project type, attach the group/project
470 * dquot pointer to the udquot as a hint for future lookups.
1da177e4
LT
471 */
472STATIC void
92f8ff73
CS
473xfs_qm_dqattach_hint(
474 struct xfs_inode *ip,
475 int type)
1da177e4 476{
92f8ff73
CS
477 struct xfs_dquot **dqhintp;
478 struct xfs_dquot *dqp;
479 struct xfs_dquot *udq = ip->i_udquot;
480
481 ASSERT(type == XFS_DQ_GROUP || type == XFS_DQ_PROJ);
1da177e4 482
8e9b6e7f 483 xfs_dqlock(udq);
1da177e4 484
92f8ff73
CS
485 if (type == XFS_DQ_GROUP) {
486 dqp = ip->i_gdquot;
487 dqhintp = &udq->q_gdquot;
488 } else {
489 dqp = ip->i_pdquot;
490 dqhintp = &udq->q_pdquot;
491 }
492
493 if (*dqhintp) {
494 struct xfs_dquot *tmp;
495
496 if (*dqhintp == dqp)
ab680bb7 497 goto done;
1da177e4 498
92f8ff73
CS
499 tmp = *dqhintp;
500 *dqhintp = NULL;
1da177e4 501 xfs_qm_dqrele(tmp);
1da177e4 502 }
8e9b6e7f 503
92f8ff73 504 *dqhintp = xfs_qm_dqhold(dqp);
ab680bb7 505done:
8e9b6e7f 506 xfs_dqunlock(udq);
1da177e4
LT
507}
508
b4d05e30
CH
509static bool
510xfs_qm_need_dqattach(
511 struct xfs_inode *ip)
512{
513 struct xfs_mount *mp = ip->i_mount;
514
515 if (!XFS_IS_QUOTA_RUNNING(mp))
516 return false;
517 if (!XFS_IS_QUOTA_ON(mp))
518 return false;
519 if (!XFS_NOT_DQATTACHED(mp, ip))
520 return false;
9cad19d2 521 if (xfs_is_quota_inode(&mp->m_sb, ip->i_ino))
b4d05e30
CH
522 return false;
523 return true;
524}
1da177e4
LT
525
526/*
c8ad20ff
NS
527 * Given a locked inode, attach dquot(s) to it, taking U/G/P-QUOTAON
528 * into account.
1da177e4 529 * If XFS_QMOPT_DQALLOC, the dquot(s) will be allocated if needed.
1da177e4
LT
530 * Inode may get unlocked and relocked in here, and the caller must deal with
531 * the consequences.
532 */
533int
7d095257 534xfs_qm_dqattach_locked(
1da177e4
LT
535 xfs_inode_t *ip,
536 uint flags)
537{
538 xfs_mount_t *mp = ip->i_mount;
539 uint nquotas = 0;
540 int error = 0;
541
b4d05e30 542 if (!xfs_qm_need_dqattach(ip))
014c2544 543 return 0;
1da177e4 544
7d095257 545 ASSERT(xfs_isilocked(ip, XFS_ILOCK_EXCL));
1da177e4
LT
546
547 if (XFS_IS_UQUOTA_ON(mp)) {
548 error = xfs_qm_dqattach_one(ip, ip->i_d.di_uid, XFS_DQ_USER,
549 flags & XFS_QMOPT_DQALLOC,
1da177e4
LT
550 NULL, &ip->i_udquot);
551 if (error)
552 goto done;
553 nquotas++;
554 }
579aa9ca
CH
555
556 ASSERT(xfs_isilocked(ip, XFS_ILOCK_EXCL));
92f8ff73
CS
557 if (XFS_IS_GQUOTA_ON(mp)) {
558 error = xfs_qm_dqattach_one(ip, ip->i_d.di_gid, XFS_DQ_GROUP,
1da177e4 559 flags & XFS_QMOPT_DQALLOC,
1da177e4
LT
560 ip->i_udquot, &ip->i_gdquot);
561 /*
562 * Don't worry about the udquot that we may have
563 * attached above. It'll get detached, if not already.
564 */
565 if (error)
566 goto done;
567 nquotas++;
568 }
569
92f8ff73
CS
570 ASSERT(xfs_isilocked(ip, XFS_ILOCK_EXCL));
571 if (XFS_IS_PQUOTA_ON(mp)) {
572 error = xfs_qm_dqattach_one(ip, xfs_get_projid(ip), XFS_DQ_PROJ,
573 flags & XFS_QMOPT_DQALLOC,
574 ip->i_udquot, &ip->i_pdquot);
575 /*
576 * Don't worry about the udquot that we may have
577 * attached above. It'll get detached, if not already.
578 */
579 if (error)
580 goto done;
581 nquotas++;
582 }
583
1da177e4 584 /*
92f8ff73 585 * Attach this group/project quota to the user quota as a hint.
1da177e4
LT
586 * This WON'T, in general, result in a thrash.
587 */
92f8ff73 588 if (nquotas > 1 && ip->i_udquot) {
579aa9ca 589 ASSERT(xfs_isilocked(ip, XFS_ILOCK_EXCL));
92f8ff73
CS
590 ASSERT(ip->i_gdquot || !XFS_IS_GQUOTA_ON(mp));
591 ASSERT(ip->i_pdquot || !XFS_IS_PQUOTA_ON(mp));
1da177e4
LT
592
593 /*
ab680bb7
CH
594 * We do not have i_udquot locked at this point, but this check
595 * is OK since we don't depend on the i_gdquot to be accurate
596 * 100% all the time. It is just a hint, and this will
597 * succeed in general.
1da177e4 598 */
ab680bb7 599 if (ip->i_udquot->q_gdquot != ip->i_gdquot)
92f8ff73
CS
600 xfs_qm_dqattach_hint(ip, XFS_DQ_GROUP);
601
602 if (ip->i_udquot->q_pdquot != ip->i_pdquot)
603 xfs_qm_dqattach_hint(ip, XFS_DQ_PROJ);
1da177e4
LT
604 }
605
7d095257 606 done:
ea15ab3c
CH
607#ifdef DEBUG
608 if (!error) {
1da177e4
LT
609 if (XFS_IS_UQUOTA_ON(mp))
610 ASSERT(ip->i_udquot);
92f8ff73 611 if (XFS_IS_GQUOTA_ON(mp))
1da177e4 612 ASSERT(ip->i_gdquot);
92f8ff73
CS
613 if (XFS_IS_PQUOTA_ON(mp))
614 ASSERT(ip->i_pdquot);
1da177e4 615 }
7d095257 616 ASSERT(xfs_isilocked(ip, XFS_ILOCK_EXCL));
1da177e4 617#endif
7d095257
CH
618 return error;
619}
1da177e4 620
7d095257
CH
621int
622xfs_qm_dqattach(
623 struct xfs_inode *ip,
624 uint flags)
625{
626 int error;
627
b4d05e30
CH
628 if (!xfs_qm_need_dqattach(ip))
629 return 0;
630
7d095257
CH
631 xfs_ilock(ip, XFS_ILOCK_EXCL);
632 error = xfs_qm_dqattach_locked(ip, flags);
633 xfs_iunlock(ip, XFS_ILOCK_EXCL);
1da177e4 634
014c2544 635 return error;
1da177e4
LT
636}
637
638/*
639 * Release dquots (and their references) if any.
640 * The inode should be locked EXCL except when this's called by
641 * xfs_ireclaim.
642 */
643void
644xfs_qm_dqdetach(
645 xfs_inode_t *ip)
646{
92f8ff73 647 if (!(ip->i_udquot || ip->i_gdquot || ip->i_pdquot))
1da177e4
LT
648 return;
649
0b1b213f
CH
650 trace_xfs_dquot_dqdetach(ip);
651
9cad19d2 652 ASSERT(!xfs_is_quota_inode(&ip->i_mount->m_sb, ip->i_ino));
1da177e4
LT
653 if (ip->i_udquot) {
654 xfs_qm_dqrele(ip->i_udquot);
655 ip->i_udquot = NULL;
656 }
657 if (ip->i_gdquot) {
658 xfs_qm_dqrele(ip->i_gdquot);
659 ip->i_gdquot = NULL;
660 }
92f8ff73
CS
661 if (ip->i_pdquot) {
662 xfs_qm_dqrele(ip->i_pdquot);
663 ip->i_pdquot = NULL;
664 }
1da177e4
LT
665}
666
3fe58f30
CH
667int
668xfs_qm_calc_dquots_per_chunk(
669 struct xfs_mount *mp,
670 unsigned int nbblks) /* basic block units */
671{
672 unsigned int ndquots;
673
674 ASSERT(nbblks > 0);
675 ndquots = BBTOB(nbblks);
676 do_div(ndquots, sizeof(xfs_dqblk_t));
677
678 return ndquots;
679}
680
cd56a39a
DC
681struct xfs_qm_isolate {
682 struct list_head buffers;
683 struct list_head dispose;
684};
685
686static enum lru_status
687xfs_qm_dquot_isolate(
688 struct list_head *item,
689 spinlock_t *lru_lock,
690 void *arg)
691{
692 struct xfs_dquot *dqp = container_of(item,
693 struct xfs_dquot, q_lru);
694 struct xfs_qm_isolate *isol = arg;
695
696 if (!xfs_dqlock_nowait(dqp))
697 goto out_miss_busy;
698
699 /*
700 * This dquot has acquired a reference in the meantime remove it from
701 * the freelist and try again.
702 */
703 if (dqp->q_nrefs) {
704 xfs_dqunlock(dqp);
705 XFS_STATS_INC(xs_qm_dqwants);
706
707 trace_xfs_dqreclaim_want(dqp);
708 list_del_init(&dqp->q_lru);
709 XFS_STATS_DEC(xs_qm_dquot_unused);
35163417 710 return LRU_REMOVED;
cd56a39a
DC
711 }
712
713 /*
714 * If the dquot is dirty, flush it. If it's already being flushed, just
715 * skip it so there is time for the IO to complete before we try to
716 * reclaim it again on the next LRU pass.
717 */
718 if (!xfs_dqflock_nowait(dqp)) {
719 xfs_dqunlock(dqp);
720 goto out_miss_busy;
721 }
722
723 if (XFS_DQ_IS_DIRTY(dqp)) {
724 struct xfs_buf *bp = NULL;
725 int error;
726
727 trace_xfs_dqreclaim_dirty(dqp);
728
729 /* we have to drop the LRU lock to flush the dquot */
730 spin_unlock(lru_lock);
731
732 error = xfs_qm_dqflush(dqp, &bp);
733 if (error) {
734 xfs_warn(dqp->q_mount, "%s: dquot %p flush failed",
735 __func__, dqp);
736 goto out_unlock_dirty;
737 }
738
739 xfs_buf_delwri_queue(bp, &isol->buffers);
740 xfs_buf_relse(bp);
741 goto out_unlock_dirty;
742 }
743 xfs_dqfunlock(dqp);
744
745 /*
746 * Prevent lookups now that we are past the point of no return.
747 */
748 dqp->dq_flags |= XFS_DQ_FREEING;
749 xfs_dqunlock(dqp);
750
751 ASSERT(dqp->q_nrefs == 0);
752 list_move_tail(&dqp->q_lru, &isol->dispose);
753 XFS_STATS_DEC(xs_qm_dquot_unused);
754 trace_xfs_dqreclaim_done(dqp);
755 XFS_STATS_INC(xs_qm_dqreclaims);
35163417 756 return LRU_REMOVED;
cd56a39a
DC
757
758out_miss_busy:
759 trace_xfs_dqreclaim_busy(dqp);
760 XFS_STATS_INC(xs_qm_dqreclaim_misses);
35163417 761 return LRU_SKIP;
cd56a39a
DC
762
763out_unlock_dirty:
764 trace_xfs_dqreclaim_busy(dqp);
765 XFS_STATS_INC(xs_qm_dqreclaim_misses);
35163417
DC
766 xfs_dqunlock(dqp);
767 spin_lock(lru_lock);
768 return LRU_RETRY;
cd56a39a
DC
769}
770
2f5b56f8 771static unsigned long
cd56a39a
DC
772xfs_qm_shrink_scan(
773 struct shrinker *shrink,
774 struct shrink_control *sc)
775{
776 struct xfs_quotainfo *qi = container_of(shrink,
777 struct xfs_quotainfo, qi_shrinker);
778 struct xfs_qm_isolate isol;
2f5b56f8 779 unsigned long freed;
cd56a39a
DC
780 int error;
781 unsigned long nr_to_scan = sc->nr_to_scan;
782
783 if ((sc->gfp_mask & (__GFP_FS|__GFP_WAIT)) != (__GFP_FS|__GFP_WAIT))
784 return 0;
785
786 INIT_LIST_HEAD(&isol.buffers);
787 INIT_LIST_HEAD(&isol.dispose);
788
789 freed = list_lru_walk_node(&qi->qi_lru, sc->nid, xfs_qm_dquot_isolate, &isol,
790 &nr_to_scan);
791
792 error = xfs_buf_delwri_submit(&isol.buffers);
793 if (error)
794 xfs_warn(NULL, "%s: dquot reclaim failed", __func__);
795
796 while (!list_empty(&isol.dispose)) {
797 struct xfs_dquot *dqp;
798
799 dqp = list_first_entry(&isol.dispose, struct xfs_dquot, q_lru);
800 list_del_init(&dqp->q_lru);
801 xfs_qm_dqfree_one(dqp);
802 }
803
804 return freed;
805}
806
2f5b56f8 807static unsigned long
cd56a39a
DC
808xfs_qm_shrink_count(
809 struct shrinker *shrink,
810 struct shrink_control *sc)
811{
812 struct xfs_quotainfo *qi = container_of(shrink,
813 struct xfs_quotainfo, qi_shrinker);
814
815 return list_lru_count_node(&qi->qi_lru, sc->nid);
816}
817
1da177e4
LT
818/*
819 * This initializes all the quota information that's kept in the
820 * mount structure
821 */
ba0f32d4 822STATIC int
1da177e4
LT
823xfs_qm_init_quotainfo(
824 xfs_mount_t *mp)
825{
826 xfs_quotainfo_t *qinf;
827 int error;
828 xfs_dquot_t *dqp;
829
830 ASSERT(XFS_IS_QUOTA_RUNNING(mp));
831
1da177e4
LT
832 qinf = mp->m_quotainfo = kmem_zalloc(sizeof(xfs_quotainfo_t), KM_SLEEP);
833
834 /*
835 * See if quotainodes are setup, and if not, allocate them,
836 * and change the superblock accordingly.
837 */
838 if ((error = xfs_qm_init_quotainos(mp))) {
f0e2d93c 839 kmem_free(qinf);
1da177e4 840 mp->m_quotainfo = NULL;
014c2544 841 return error;
1da177e4
LT
842 }
843
9f920f11
CH
844 INIT_RADIX_TREE(&qinf->qi_uquota_tree, GFP_NOFS);
845 INIT_RADIX_TREE(&qinf->qi_gquota_tree, GFP_NOFS);
92f8ff73 846 INIT_RADIX_TREE(&qinf->qi_pquota_tree, GFP_NOFS);
9f920f11
CH
847 mutex_init(&qinf->qi_tree_lock);
848
cd56a39a 849 list_lru_init(&qinf->qi_lru);
f8739c3c 850
1da177e4 851 /* mutex used to serialize quotaoffs */
794ee1ba 852 mutex_init(&qinf->qi_quotaofflock);
1da177e4
LT
853
854 /* Precalc some constants */
855 qinf->qi_dqchunklen = XFS_FSB_TO_BB(mp, XFS_DQUOT_CLUSTER_SIZE_FSB);
3fe58f30
CH
856 qinf->qi_dqperchunk = xfs_qm_calc_dquots_per_chunk(mp,
857 qinf->qi_dqchunklen);
1da177e4
LT
858
859 mp->m_qflags |= (mp->m_sb.sb_qflags & XFS_ALL_QUOTA_CHKD);
860
861 /*
862 * We try to get the limits from the superuser's limits fields.
863 * This is quite hacky, but it is standard quota practice.
7ae44407 864 *
1da177e4
LT
865 * We look at the USR dquot with id == 0 first, but if user quotas
866 * are not enabled we goto the GRP dquot with id == 0.
867 * We don't really care to keep separate default limits for user
868 * and group quotas, at least not at this point.
7ae44407
CH
869 *
870 * Since we may not have done a quotacheck by this point, just read
871 * the dquot without attaching it to any hashtables or lists.
1da177e4 872 */
7ae44407
CH
873 error = xfs_qm_dqread(mp, 0,
874 XFS_IS_UQUOTA_RUNNING(mp) ? XFS_DQ_USER :
875 (XFS_IS_GQUOTA_RUNNING(mp) ? XFS_DQ_GROUP :
876 XFS_DQ_PROJ),
877 XFS_QMOPT_DOWARN, &dqp);
878 if (!error) {
1da177e4
LT
879 xfs_disk_dquot_t *ddqp = &dqp->q_core;
880
881 /*
882 * The warnings and timers set the grace period given to
883 * a user or group before he or she can not perform any
884 * more writing. If it is zero, a default is used.
885 */
1149d96a
CH
886 qinf->qi_btimelimit = ddqp->d_btimer ?
887 be32_to_cpu(ddqp->d_btimer) : XFS_QM_BTIMELIMIT;
888 qinf->qi_itimelimit = ddqp->d_itimer ?
889 be32_to_cpu(ddqp->d_itimer) : XFS_QM_ITIMELIMIT;
890 qinf->qi_rtbtimelimit = ddqp->d_rtbtimer ?
891 be32_to_cpu(ddqp->d_rtbtimer) : XFS_QM_RTBTIMELIMIT;
892 qinf->qi_bwarnlimit = ddqp->d_bwarns ?
893 be16_to_cpu(ddqp->d_bwarns) : XFS_QM_BWARNLIMIT;
894 qinf->qi_iwarnlimit = ddqp->d_iwarns ?
895 be16_to_cpu(ddqp->d_iwarns) : XFS_QM_IWARNLIMIT;
896 qinf->qi_rtbwarnlimit = ddqp->d_rtbwarns ?
897 be16_to_cpu(ddqp->d_rtbwarns) : XFS_QM_RTBWARNLIMIT;
898 qinf->qi_bhardlimit = be64_to_cpu(ddqp->d_blk_hardlimit);
899 qinf->qi_bsoftlimit = be64_to_cpu(ddqp->d_blk_softlimit);
900 qinf->qi_ihardlimit = be64_to_cpu(ddqp->d_ino_hardlimit);
901 qinf->qi_isoftlimit = be64_to_cpu(ddqp->d_ino_softlimit);
902 qinf->qi_rtbhardlimit = be64_to_cpu(ddqp->d_rtb_hardlimit);
903 qinf->qi_rtbsoftlimit = be64_to_cpu(ddqp->d_rtb_softlimit);
1da177e4 904
1da177e4
LT
905 xfs_qm_dqdestroy(dqp);
906 } else {
907 qinf->qi_btimelimit = XFS_QM_BTIMELIMIT;
908 qinf->qi_itimelimit = XFS_QM_ITIMELIMIT;
909 qinf->qi_rtbtimelimit = XFS_QM_RTBTIMELIMIT;
910 qinf->qi_bwarnlimit = XFS_QM_BWARNLIMIT;
911 qinf->qi_iwarnlimit = XFS_QM_IWARNLIMIT;
06d10dd9 912 qinf->qi_rtbwarnlimit = XFS_QM_RTBWARNLIMIT;
1da177e4
LT
913 }
914
cd56a39a
DC
915 qinf->qi_shrinker.count_objects = xfs_qm_shrink_count;
916 qinf->qi_shrinker.scan_objects = xfs_qm_shrink_scan;
f8739c3c 917 qinf->qi_shrinker.seeks = DEFAULT_SEEKS;
cd56a39a 918 qinf->qi_shrinker.flags = SHRINKER_NUMA_AWARE;
f8739c3c 919 register_shrinker(&qinf->qi_shrinker);
014c2544 920 return 0;
1da177e4
LT
921}
922
923
924/*
925 * Gets called when unmounting a filesystem or when all quotas get
926 * turned off.
927 * This purges the quota inodes, destroys locks and frees itself.
928 */
929void
930xfs_qm_destroy_quotainfo(
931 xfs_mount_t *mp)
932{
933 xfs_quotainfo_t *qi;
934
935 qi = mp->m_quotainfo;
936 ASSERT(qi != NULL);
1da177e4 937
f8739c3c
CH
938 unregister_shrinker(&qi->qi_shrinker);
939
1da177e4 940 if (qi->qi_uquotaip) {
26cc0021 941 IRELE(qi->qi_uquotaip);
1da177e4
LT
942 qi->qi_uquotaip = NULL; /* paranoia */
943 }
944 if (qi->qi_gquotaip) {
26cc0021 945 IRELE(qi->qi_gquotaip);
1da177e4
LT
946 qi->qi_gquotaip = NULL;
947 }
92f8ff73
CS
948 if (qi->qi_pquotaip) {
949 IRELE(qi->qi_pquotaip);
950 qi->qi_pquotaip = NULL;
951 }
1da177e4 952 mutex_destroy(&qi->qi_quotaofflock);
f0e2d93c 953 kmem_free(qi);
1da177e4
LT
954 mp->m_quotainfo = NULL;
955}
956
1da177e4
LT
957/*
958 * Create an inode and return with a reference already taken, but unlocked
959 * This is how we create quota inodes
960 */
961STATIC int
962xfs_qm_qino_alloc(
963 xfs_mount_t *mp,
964 xfs_inode_t **ip,
965 __int64_t sbfields,
966 uint flags)
967{
968 xfs_trans_t *tp;
969 int error;
1da177e4
LT
970 int committed;
971
d892d586
CS
972 *ip = NULL;
973 /*
974 * With superblock that doesn't have separate pquotino, we
975 * share an inode between gquota and pquota. If the on-disk
976 * superblock has GQUOTA and the filesystem is now mounted
977 * with PQUOTA, just use sb_gquotino for sb_pquotino and
978 * vice-versa.
979 */
980 if (!xfs_sb_version_has_pquotino(&mp->m_sb) &&
981 (flags & (XFS_QMOPT_PQUOTA|XFS_QMOPT_GQUOTA))) {
982 xfs_ino_t ino = NULLFSINO;
983
984 if ((flags & XFS_QMOPT_PQUOTA) &&
985 (mp->m_sb.sb_gquotino != NULLFSINO)) {
986 ino = mp->m_sb.sb_gquotino;
987 ASSERT(mp->m_sb.sb_pquotino == NULLFSINO);
988 } else if ((flags & XFS_QMOPT_GQUOTA) &&
989 (mp->m_sb.sb_pquotino != NULLFSINO)) {
990 ino = mp->m_sb.sb_pquotino;
991 ASSERT(mp->m_sb.sb_gquotino == NULLFSINO);
992 }
993 if (ino != NULLFSINO) {
994 error = xfs_iget(mp, NULL, ino, 0, 0, ip);
995 if (error)
996 return error;
997 mp->m_sb.sb_gquotino = NULLFSINO;
998 mp->m_sb.sb_pquotino = NULLFSINO;
999 }
1000 }
1001
061f7209 1002 tp = xfs_trans_alloc(mp, XFS_TRANS_QM_QINOCREATE);
3d3c8b52
JL
1003 error = xfs_trans_reserve(tp, &M_RES(mp)->tr_create,
1004 XFS_QM_QINOCREATE_SPACE_RES(mp), 0);
1005 if (error) {
1da177e4 1006 xfs_trans_cancel(tp, 0);
014c2544 1007 return error;
1da177e4 1008 }
1da177e4 1009
d892d586
CS
1010 if (!*ip) {
1011 error = xfs_dir_ialloc(&tp, NULL, S_IFREG, 1, 0, 0, 1, ip,
1012 &committed);
1013 if (error) {
1014 xfs_trans_cancel(tp, XFS_TRANS_RELEASE_LOG_RES |
1015 XFS_TRANS_ABORT);
1016 return error;
1017 }
1da177e4
LT
1018 }
1019
1da177e4
LT
1020 /*
1021 * Make the changes in the superblock, and log those too.
1022 * sbfields arg may contain fields other than *QUOTINO;
1023 * VERSIONNUM for example.
1024 */
3685c2a1 1025 spin_lock(&mp->m_sb_lock);
1da177e4 1026 if (flags & XFS_QMOPT_SBVERSION) {
62118709 1027 ASSERT(!xfs_sb_version_hasquota(&mp->m_sb));
1da177e4 1028 ASSERT((sbfields & (XFS_SB_VERSIONNUM | XFS_SB_UQUOTINO |
d892d586
CS
1029 XFS_SB_GQUOTINO | XFS_SB_PQUOTINO | XFS_SB_QFLAGS)) ==
1030 (XFS_SB_VERSIONNUM | XFS_SB_UQUOTINO |
1031 XFS_SB_GQUOTINO | XFS_SB_PQUOTINO |
1032 XFS_SB_QFLAGS));
1da177e4 1033
62118709 1034 xfs_sb_version_addquota(&mp->m_sb);
1da177e4
LT
1035 mp->m_sb.sb_uquotino = NULLFSINO;
1036 mp->m_sb.sb_gquotino = NULLFSINO;
d892d586 1037 mp->m_sb.sb_pquotino = NULLFSINO;
1da177e4 1038
d892d586
CS
1039 /* qflags will get updated fully _after_ quotacheck */
1040 mp->m_sb.sb_qflags = mp->m_qflags & XFS_ALL_QUOTA_ACCT;
1da177e4
LT
1041 }
1042 if (flags & XFS_QMOPT_UQUOTA)
1043 mp->m_sb.sb_uquotino = (*ip)->i_ino;
d892d586 1044 else if (flags & XFS_QMOPT_GQUOTA)
1da177e4 1045 mp->m_sb.sb_gquotino = (*ip)->i_ino;
d892d586
CS
1046 else
1047 mp->m_sb.sb_pquotino = (*ip)->i_ino;
3685c2a1 1048 spin_unlock(&mp->m_sb_lock);
1da177e4
LT
1049 xfs_mod_sb(tp, sbfields);
1050
1c72bf90 1051 if ((error = xfs_trans_commit(tp, XFS_TRANS_RELEASE_LOG_RES))) {
53487786 1052 xfs_alert(mp, "%s failed (error %d)!", __func__, error);
014c2544 1053 return error;
1da177e4 1054 }
014c2544 1055 return 0;
1da177e4
LT
1056}
1057
1058
5b139738 1059STATIC void
1da177e4
LT
1060xfs_qm_reset_dqcounts(
1061 xfs_mount_t *mp,
1062 xfs_buf_t *bp,
1063 xfs_dqid_t id,
1064 uint type)
1065{
6fcdc59d 1066 struct xfs_dqblk *dqb;
1da177e4
LT
1067 int j;
1068
0b1b213f
CH
1069 trace_xfs_reset_dqcounts(bp, _RET_IP_);
1070
1da177e4
LT
1071 /*
1072 * Reset all counters and timers. They'll be
1073 * started afresh by xfs_qm_quotacheck.
1074 */
1075#ifdef DEBUG
1076 j = XFS_FSB_TO_B(mp, XFS_DQUOT_CLUSTER_SIZE_FSB);
1077 do_div(j, sizeof(xfs_dqblk_t));
8a7b8a89 1078 ASSERT(mp->m_quotainfo->qi_dqperchunk == j);
1da177e4 1079#endif
6fcdc59d 1080 dqb = bp->b_addr;
8a7b8a89 1081 for (j = 0; j < mp->m_quotainfo->qi_dqperchunk; j++) {
6fcdc59d
DC
1082 struct xfs_disk_dquot *ddq;
1083
1084 ddq = (struct xfs_disk_dquot *)&dqb[j];
1085
1da177e4
LT
1086 /*
1087 * Do a sanity check, and if needed, repair the dqblk. Don't
1088 * output any warnings because it's perfectly possible to
c41564b5 1089 * find uninitialised dquot blks. See comment in xfs_qm_dqcheck.
1da177e4 1090 */
a0fa2b67 1091 (void) xfs_qm_dqcheck(mp, ddq, id+j, type, XFS_QMOPT_DQREPAIR,
1da177e4 1092 "xfs_quotacheck");
1149d96a
CH
1093 ddq->d_bcount = 0;
1094 ddq->d_icount = 0;
1095 ddq->d_rtbcount = 0;
1096 ddq->d_btimer = 0;
1097 ddq->d_itimer = 0;
1098 ddq->d_rtbtimer = 0;
1099 ddq->d_bwarns = 0;
1100 ddq->d_iwarns = 0;
1101 ddq->d_rtbwarns = 0;
6fcdc59d
DC
1102
1103 if (xfs_sb_version_hascrc(&mp->m_sb)) {
1104 xfs_update_cksum((char *)&dqb[j],
1105 sizeof(struct xfs_dqblk),
1106 XFS_DQUOT_CRC_OFF);
1107 }
1da177e4 1108 }
1da177e4
LT
1109}
1110
1111STATIC int
1112xfs_qm_dqiter_bufs(
43ff2122
CH
1113 struct xfs_mount *mp,
1114 xfs_dqid_t firstid,
1115 xfs_fsblock_t bno,
1116 xfs_filblks_t blkcnt,
1117 uint flags,
1118 struct list_head *buffer_list)
1da177e4 1119{
43ff2122
CH
1120 struct xfs_buf *bp;
1121 int error;
1122 int type;
1da177e4
LT
1123
1124 ASSERT(blkcnt > 0);
c8ad20ff
NS
1125 type = flags & XFS_QMOPT_UQUOTA ? XFS_DQ_USER :
1126 (flags & XFS_QMOPT_PQUOTA ? XFS_DQ_PROJ : XFS_DQ_GROUP);
1da177e4
LT
1127 error = 0;
1128
1129 /*
1130 * Blkcnt arg can be a very big number, and might even be
1131 * larger than the log itself. So, we have to break it up into
1132 * manageable-sized transactions.
1133 * Note that we don't start a permanent transaction here; we might
1134 * not be able to get a log reservation for the whole thing up front,
1135 * and we don't really care to either, because we just discard
1136 * everything if we were to crash in the middle of this loop.
1137 */
1138 while (blkcnt--) {
1139 error = xfs_trans_read_buf(mp, NULL, mp->m_ddev_targp,
1140 XFS_FSB_TO_DADDR(mp, bno),
c6319198 1141 mp->m_quotainfo->qi_dqchunklen, 0, &bp,
1813dd64 1142 &xfs_dquot_buf_ops);
1da177e4 1143
3fe58f30 1144 /*
6fcdc59d
DC
1145 * CRC and validation errors will return a EFSCORRUPTED here. If
1146 * this occurs, re-read without CRC validation so that we can
1147 * repair the damage via xfs_qm_reset_dqcounts(). This process
1148 * will leave a trace in the log indicating corruption has
1149 * been detected.
3fe58f30 1150 */
6fcdc59d
DC
1151 if (error == EFSCORRUPTED) {
1152 error = xfs_trans_read_buf(mp, NULL, mp->m_ddev_targp,
1153 XFS_FSB_TO_DADDR(mp, bno),
1154 mp->m_quotainfo->qi_dqchunklen, 0, &bp,
1155 NULL);
1156 }
1157
1158 if (error)
1159 break;
1160
5b139738 1161 xfs_qm_reset_dqcounts(mp, bp, firstid, type);
43ff2122 1162 xfs_buf_delwri_queue(bp, buffer_list);
61551f1e 1163 xfs_buf_relse(bp);
6fcdc59d
DC
1164
1165 /* goto the next block. */
1da177e4 1166 bno++;
8a7b8a89 1167 firstid += mp->m_quotainfo->qi_dqperchunk;
1da177e4 1168 }
43ff2122 1169
014c2544 1170 return error;
1da177e4
LT
1171}
1172
1173/*
c8ad20ff 1174 * Iterate over all allocated USR/GRP/PRJ dquots in the system, calling a
1da177e4
LT
1175 * caller supplied function for every chunk of dquots that we find.
1176 */
1177STATIC int
1178xfs_qm_dqiterate(
43ff2122
CH
1179 struct xfs_mount *mp,
1180 struct xfs_inode *qip,
1181 uint flags,
1182 struct list_head *buffer_list)
1da177e4 1183{
43ff2122 1184 struct xfs_bmbt_irec *map;
1da177e4
LT
1185 int i, nmaps; /* number of map entries */
1186 int error; /* return value */
1187 xfs_fileoff_t lblkno;
1188 xfs_filblks_t maxlblkcnt;
1189 xfs_dqid_t firstid;
1190 xfs_fsblock_t rablkno;
1191 xfs_filblks_t rablkcnt;
1192
1193 error = 0;
1194 /*
c41564b5 1195 * This looks racy, but we can't keep an inode lock across a
1da177e4
LT
1196 * trans_reserve. But, this gets called during quotacheck, and that
1197 * happens only at mount time which is single threaded.
1198 */
1199 if (qip->i_d.di_nblocks == 0)
014c2544 1200 return 0;
1da177e4
LT
1201
1202 map = kmem_alloc(XFS_DQITER_MAP_SIZE * sizeof(*map), KM_SLEEP);
1203
1204 lblkno = 0;
32972383 1205 maxlblkcnt = XFS_B_TO_FSB(mp, mp->m_super->s_maxbytes);
1da177e4
LT
1206 do {
1207 nmaps = XFS_DQITER_MAP_SIZE;
1208 /*
1209 * We aren't changing the inode itself. Just changing
1210 * some of its data. No new blocks are added here, and
1211 * the inode is never added to the transaction.
1212 */
1213 xfs_ilock(qip, XFS_ILOCK_SHARED);
5c8ed202
DC
1214 error = xfs_bmapi_read(qip, lblkno, maxlblkcnt - lblkno,
1215 map, &nmaps, 0);
1da177e4
LT
1216 xfs_iunlock(qip, XFS_ILOCK_SHARED);
1217 if (error)
1218 break;
1219
1220 ASSERT(nmaps <= XFS_DQITER_MAP_SIZE);
1221 for (i = 0; i < nmaps; i++) {
1222 ASSERT(map[i].br_startblock != DELAYSTARTBLOCK);
1223 ASSERT(map[i].br_blockcount);
1224
1225
1226 lblkno += map[i].br_blockcount;
1227
1228 if (map[i].br_startblock == HOLESTARTBLOCK)
1229 continue;
1230
1231 firstid = (xfs_dqid_t) map[i].br_startoff *
8a7b8a89 1232 mp->m_quotainfo->qi_dqperchunk;
1da177e4
LT
1233 /*
1234 * Do a read-ahead on the next extent.
1235 */
1236 if ((i+1 < nmaps) &&
1237 (map[i+1].br_startblock != HOLESTARTBLOCK)) {
1238 rablkcnt = map[i+1].br_blockcount;
1239 rablkno = map[i+1].br_startblock;
1240 while (rablkcnt--) {
1a1a3e97 1241 xfs_buf_readahead(mp->m_ddev_targp,
1da177e4 1242 XFS_FSB_TO_DADDR(mp, rablkno),
c3f8fc73
DC
1243 mp->m_quotainfo->qi_dqchunklen,
1244 NULL);
1da177e4
LT
1245 rablkno++;
1246 }
1247 }
1248 /*
1249 * Iterate thru all the blks in the extent and
1250 * reset the counters of all the dquots inside them.
1251 */
43ff2122
CH
1252 error = xfs_qm_dqiter_bufs(mp, firstid,
1253 map[i].br_startblock,
1254 map[i].br_blockcount,
1255 flags, buffer_list);
1256 if (error)
1257 goto out;
1da177e4 1258 }
1da177e4
LT
1259 } while (nmaps > 0);
1260
43ff2122 1261out:
f0e2d93c 1262 kmem_free(map);
014c2544 1263 return error;
1da177e4
LT
1264}
1265
1266/*
1267 * Called by dqusage_adjust in doing a quotacheck.
52fda114
CH
1268 *
1269 * Given the inode, and a dquot id this updates both the incore dqout as well
1270 * as the buffer copy. This is so that once the quotacheck is done, we can
1271 * just log all the buffers, as opposed to logging numerous updates to
1272 * individual dquots.
1da177e4 1273 */
52fda114 1274STATIC int
1da177e4 1275xfs_qm_quotacheck_dqadjust(
52fda114
CH
1276 struct xfs_inode *ip,
1277 xfs_dqid_t id,
1278 uint type,
1da177e4
LT
1279 xfs_qcnt_t nblks,
1280 xfs_qcnt_t rtblks)
1281{
52fda114
CH
1282 struct xfs_mount *mp = ip->i_mount;
1283 struct xfs_dquot *dqp;
1284 int error;
1285
1286 error = xfs_qm_dqget(mp, ip, id, type,
1287 XFS_QMOPT_DQALLOC | XFS_QMOPT_DOWARN, &dqp);
1288 if (error) {
1289 /*
1290 * Shouldn't be able to turn off quotas here.
1291 */
1292 ASSERT(error != ESRCH);
1293 ASSERT(error != ENOENT);
1294 return error;
1295 }
0b1b213f
CH
1296
1297 trace_xfs_dqadjust(dqp);
1298
1da177e4
LT
1299 /*
1300 * Adjust the inode count and the block count to reflect this inode's
1301 * resource usage.
1302 */
413d57c9 1303 be64_add_cpu(&dqp->q_core.d_icount, 1);
1da177e4
LT
1304 dqp->q_res_icount++;
1305 if (nblks) {
413d57c9 1306 be64_add_cpu(&dqp->q_core.d_bcount, nblks);
1da177e4
LT
1307 dqp->q_res_bcount += nblks;
1308 }
1309 if (rtblks) {
413d57c9 1310 be64_add_cpu(&dqp->q_core.d_rtbcount, rtblks);
1da177e4
LT
1311 dqp->q_res_rtbcount += rtblks;
1312 }
1313
1314 /*
1315 * Set default limits, adjust timers (since we changed usages)
191f8488
CH
1316 *
1317 * There are no timers for the default values set in the root dquot.
1da177e4 1318 */
191f8488 1319 if (dqp->q_core.d_id) {
4b6eae2e 1320 xfs_qm_adjust_dqlimits(mp, dqp);
52fda114 1321 xfs_qm_adjust_dqtimers(mp, &dqp->q_core);
1da177e4
LT
1322 }
1323
1324 dqp->dq_flags |= XFS_DQ_DIRTY;
52fda114
CH
1325 xfs_qm_dqput(dqp);
1326 return 0;
1da177e4
LT
1327}
1328
1329STATIC int
1330xfs_qm_get_rtblks(
1331 xfs_inode_t *ip,
1332 xfs_qcnt_t *O_rtblks)
1333{
1334 xfs_filblks_t rtblks; /* total rt blks */
4eea22f0 1335 xfs_extnum_t idx; /* extent record index */
1da177e4
LT
1336 xfs_ifork_t *ifp; /* inode fork pointer */
1337 xfs_extnum_t nextents; /* number of extent entries */
1da177e4
LT
1338 int error;
1339
1340 ASSERT(XFS_IS_REALTIME_INODE(ip));
1341 ifp = XFS_IFORK_PTR(ip, XFS_DATA_FORK);
1342 if (!(ifp->if_flags & XFS_IFEXTENTS)) {
1343 if ((error = xfs_iread_extents(NULL, ip, XFS_DATA_FORK)))
014c2544 1344 return error;
1da177e4
LT
1345 }
1346 rtblks = 0;
4eea22f0 1347 nextents = ifp->if_bytes / (uint)sizeof(xfs_bmbt_rec_t);
a6f64d4a
CH
1348 for (idx = 0; idx < nextents; idx++)
1349 rtblks += xfs_bmbt_get_blockcount(xfs_iext_get_ext(ifp, idx));
1da177e4 1350 *O_rtblks = (xfs_qcnt_t)rtblks;
014c2544 1351 return 0;
1da177e4
LT
1352}
1353
1354/*
1355 * callback routine supplied to bulkstat(). Given an inumber, find its
1356 * dquots and update them to account for resources taken by that inode.
1357 */
1358/* ARGSUSED */
1359STATIC int
1360xfs_qm_dqusage_adjust(
1361 xfs_mount_t *mp, /* mount point for filesystem */
1362 xfs_ino_t ino, /* inode number to get data for */
1363 void __user *buffer, /* not used */
1364 int ubsize, /* not used */
1da177e4 1365 int *ubused, /* not used */
1da177e4
LT
1366 int *res) /* result code value */
1367{
1368 xfs_inode_t *ip;
52fda114 1369 xfs_qcnt_t nblks, rtblks = 0;
1da177e4
LT
1370 int error;
1371
1372 ASSERT(XFS_IS_QUOTA_RUNNING(mp));
1373
1374 /*
1375 * rootino must have its resources accounted for, not so with the quota
1376 * inodes.
1377 */
9cad19d2 1378 if (xfs_is_quota_inode(&mp->m_sb, ino)) {
1da177e4
LT
1379 *res = BULKSTAT_RV_NOTHING;
1380 return XFS_ERROR(EINVAL);
1381 }
1382
1383 /*
1384 * We don't _need_ to take the ilock EXCL. However, the xfs_qm_dqget
1385 * interface expects the inode to be exclusively locked because that's
1386 * the case in all other instances. It's OK that we do this because
1387 * quotacheck is done only at mount time.
1388 */
52fda114
CH
1389 error = xfs_iget(mp, NULL, ino, 0, XFS_ILOCK_EXCL, &ip);
1390 if (error) {
1da177e4 1391 *res = BULKSTAT_RV_NOTHING;
014c2544 1392 return error;
1da177e4
LT
1393 }
1394
52fda114 1395 ASSERT(ip->i_delayed_blks == 0);
1da177e4 1396
52fda114 1397 if (XFS_IS_REALTIME_INODE(ip)) {
1da177e4
LT
1398 /*
1399 * Walk thru the extent list and count the realtime blocks.
1400 */
52fda114
CH
1401 error = xfs_qm_get_rtblks(ip, &rtblks);
1402 if (error)
1403 goto error0;
1da177e4 1404 }
1da177e4 1405
52fda114 1406 nblks = (xfs_qcnt_t)ip->i_d.di_nblocks - rtblks;
1da177e4
LT
1407
1408 /*
1409 * Add the (disk blocks and inode) resources occupied by this
1410 * inode to its dquots. We do this adjustment in the incore dquot,
1411 * and also copy the changes to its buffer.
1412 * We don't care about putting these changes in a transaction
1413 * envelope because if we crash in the middle of a 'quotacheck'
1414 * we have to start from the beginning anyway.
1415 * Once we're done, we'll log all the dquot bufs.
1416 *
c41564b5 1417 * The *QUOTA_ON checks below may look pretty racy, but quotachecks
1da177e4
LT
1418 * and quotaoffs don't race. (Quotachecks happen at mount time only).
1419 */
1420 if (XFS_IS_UQUOTA_ON(mp)) {
52fda114
CH
1421 error = xfs_qm_quotacheck_dqadjust(ip, ip->i_d.di_uid,
1422 XFS_DQ_USER, nblks, rtblks);
1423 if (error)
1424 goto error0;
1da177e4 1425 }
52fda114
CH
1426
1427 if (XFS_IS_GQUOTA_ON(mp)) {
1428 error = xfs_qm_quotacheck_dqadjust(ip, ip->i_d.di_gid,
1429 XFS_DQ_GROUP, nblks, rtblks);
1430 if (error)
1431 goto error0;
1da177e4 1432 }
1da177e4 1433
52fda114 1434 if (XFS_IS_PQUOTA_ON(mp)) {
6743099c 1435 error = xfs_qm_quotacheck_dqadjust(ip, xfs_get_projid(ip),
52fda114
CH
1436 XFS_DQ_PROJ, nblks, rtblks);
1437 if (error)
1438 goto error0;
1439 }
1440
1441 xfs_iunlock(ip, XFS_ILOCK_EXCL);
1442 IRELE(ip);
1da177e4 1443 *res = BULKSTAT_RV_DIDONE;
014c2544 1444 return 0;
52fda114
CH
1445
1446error0:
1447 xfs_iunlock(ip, XFS_ILOCK_EXCL);
1448 IRELE(ip);
1449 *res = BULKSTAT_RV_GIVEUP;
1450 return error;
1da177e4
LT
1451}
1452
b84a3a96
CH
1453STATIC int
1454xfs_qm_flush_one(
43ff2122
CH
1455 struct xfs_dquot *dqp,
1456 void *data)
b84a3a96 1457{
43ff2122 1458 struct list_head *buffer_list = data;
fe7257fd 1459 struct xfs_buf *bp = NULL;
b84a3a96
CH
1460 int error = 0;
1461
1462 xfs_dqlock(dqp);
1463 if (dqp->dq_flags & XFS_DQ_FREEING)
1464 goto out_unlock;
1465 if (!XFS_DQ_IS_DIRTY(dqp))
1466 goto out_unlock;
1467
43ff2122 1468 xfs_dqflock(dqp);
fe7257fd
CH
1469 error = xfs_qm_dqflush(dqp, &bp);
1470 if (error)
1471 goto out_unlock;
b84a3a96 1472
43ff2122 1473 xfs_buf_delwri_queue(bp, buffer_list);
fe7257fd 1474 xfs_buf_relse(bp);
b84a3a96
CH
1475out_unlock:
1476 xfs_dqunlock(dqp);
1477 return error;
1478}
1479
1da177e4
LT
1480/*
1481 * Walk thru all the filesystem inodes and construct a consistent view
1482 * of the disk quota world. If the quotacheck fails, disable quotas.
1483 */
1484int
1485xfs_qm_quotacheck(
1486 xfs_mount_t *mp)
1487{
113a5683
CS
1488 int done, count, error, error2;
1489 xfs_ino_t lastino;
1490 size_t structsz;
1491 uint flags;
1492 LIST_HEAD (buffer_list);
1493 struct xfs_inode *uip = mp->m_quotainfo->qi_uquotaip;
1494 struct xfs_inode *gip = mp->m_quotainfo->qi_gquotaip;
92f8ff73 1495 struct xfs_inode *pip = mp->m_quotainfo->qi_pquotaip;
1da177e4
LT
1496
1497 count = INT_MAX;
1498 structsz = 1;
1499 lastino = 0;
1500 flags = 0;
1501
92f8ff73 1502 ASSERT(uip || gip || pip);
1da177e4
LT
1503 ASSERT(XFS_IS_QUOTA_RUNNING(mp));
1504
0b932ccc 1505 xfs_notice(mp, "Quotacheck needed: Please wait.");
1da177e4
LT
1506
1507 /*
c8ad20ff 1508 * First we go thru all the dquots on disk, USR and GRP/PRJ, and reset
1da177e4
LT
1509 * their counters to zero. We need a clean slate.
1510 * We don't log our changes till later.
1511 */
8a7b8a89 1512 if (uip) {
43ff2122
CH
1513 error = xfs_qm_dqiterate(mp, uip, XFS_QMOPT_UQUOTA,
1514 &buffer_list);
8a7b8a89 1515 if (error)
1da177e4
LT
1516 goto error_return;
1517 flags |= XFS_UQUOTA_CHKD;
1518 }
1519
8a7b8a89 1520 if (gip) {
92f8ff73 1521 error = xfs_qm_dqiterate(mp, gip, XFS_QMOPT_GQUOTA,
43ff2122 1522 &buffer_list);
8a7b8a89 1523 if (error)
1da177e4 1524 goto error_return;
92f8ff73
CS
1525 flags |= XFS_GQUOTA_CHKD;
1526 }
1527
1528 if (pip) {
1529 error = xfs_qm_dqiterate(mp, pip, XFS_QMOPT_PQUOTA,
1530 &buffer_list);
1531 if (error)
1532 goto error_return;
1533 flags |= XFS_PQUOTA_CHKD;
1da177e4
LT
1534 }
1535
1536 do {
1537 /*
1538 * Iterate thru all the inodes in the file system,
1539 * adjusting the corresponding dquot counters in core.
1540 */
7dce11db
CH
1541 error = xfs_bulkstat(mp, &lastino, &count,
1542 xfs_qm_dqusage_adjust,
1543 structsz, NULL, &done);
1544 if (error)
1da177e4
LT
1545 break;
1546
7dce11db 1547 } while (!done);
1da177e4 1548
4b8879df 1549 /*
b84a3a96
CH
1550 * We've made all the changes that we need to make incore. Flush them
1551 * down to disk buffers if everything was updated successfully.
4b8879df 1552 */
43ff2122
CH
1553 if (XFS_IS_UQUOTA_ON(mp)) {
1554 error = xfs_qm_dquot_walk(mp, XFS_DQ_USER, xfs_qm_flush_one,
1555 &buffer_list);
1556 }
b84a3a96 1557 if (XFS_IS_GQUOTA_ON(mp)) {
43ff2122
CH
1558 error2 = xfs_qm_dquot_walk(mp, XFS_DQ_GROUP, xfs_qm_flush_one,
1559 &buffer_list);
b84a3a96
CH
1560 if (!error)
1561 error = error2;
1562 }
1563 if (XFS_IS_PQUOTA_ON(mp)) {
43ff2122
CH
1564 error2 = xfs_qm_dquot_walk(mp, XFS_DQ_PROJ, xfs_qm_flush_one,
1565 &buffer_list);
b84a3a96
CH
1566 if (!error)
1567 error = error2;
1568 }
4b8879df 1569
43ff2122
CH
1570 error2 = xfs_buf_delwri_submit(&buffer_list);
1571 if (!error)
1572 error = error2;
1573
1da177e4
LT
1574 /*
1575 * We can get this error if we couldn't do a dquot allocation inside
1576 * xfs_qm_dqusage_adjust (via bulkstat). We don't care about the
1577 * dirty dquots that might be cached, we just want to get rid of them
1578 * and turn quotaoff. The dquots won't be attached to any of the inodes
1579 * at this point (because we intentionally didn't in dqget_noattach).
1580 */
1581 if (error) {
8112e9dc 1582 xfs_qm_dqpurge_all(mp, XFS_QMOPT_QUOTALL);
1da177e4
LT
1583 goto error_return;
1584 }
1da177e4 1585
1da177e4
LT
1586 /*
1587 * If one type of quotas is off, then it will lose its
1588 * quotachecked status, since we won't be doing accounting for
1589 * that type anymore.
1590 */
4177af3a 1591 mp->m_qflags &= ~XFS_ALL_QUOTA_CHKD;
1da177e4
LT
1592 mp->m_qflags |= flags;
1593
1da177e4 1594 error_return:
43ff2122
CH
1595 while (!list_empty(&buffer_list)) {
1596 struct xfs_buf *bp =
1597 list_first_entry(&buffer_list, struct xfs_buf, b_list);
1598 list_del_init(&bp->b_list);
1599 xfs_buf_relse(bp);
1600 }
1601
1da177e4 1602 if (error) {
0b932ccc
DC
1603 xfs_warn(mp,
1604 "Quotacheck: Unsuccessful (Error %d): Disabling quotas.",
1605 error);
1da177e4
LT
1606 /*
1607 * We must turn off quotas.
1608 */
1609 ASSERT(mp->m_quotainfo != NULL);
1da177e4 1610 xfs_qm_destroy_quotainfo(mp);
31d5577b 1611 if (xfs_mount_reset_sbqflags(mp)) {
0b932ccc
DC
1612 xfs_warn(mp,
1613 "Quotacheck: Failed to reset quota flags.");
31d5577b 1614 }
0b932ccc
DC
1615 } else
1616 xfs_notice(mp, "Quotacheck: Done.");
1da177e4
LT
1617 return (error);
1618}
1619
1620/*
1621 * This is called after the superblock has been read in and we're ready to
1622 * iget the quota inodes.
1623 */
1624STATIC int
1625xfs_qm_init_quotainos(
1626 xfs_mount_t *mp)
1627{
113a5683
CS
1628 struct xfs_inode *uip = NULL;
1629 struct xfs_inode *gip = NULL;
92f8ff73 1630 struct xfs_inode *pip = NULL;
113a5683
CS
1631 int error;
1632 __int64_t sbflags = 0;
1633 uint flags = 0;
1da177e4
LT
1634
1635 ASSERT(mp->m_quotainfo);
1da177e4
LT
1636
1637 /*
1638 * Get the uquota and gquota inodes
1639 */
62118709 1640 if (xfs_sb_version_hasquota(&mp->m_sb)) {
1da177e4
LT
1641 if (XFS_IS_UQUOTA_ON(mp) &&
1642 mp->m_sb.sb_uquotino != NULLFSINO) {
1643 ASSERT(mp->m_sb.sb_uquotino > 0);
113a5683
CS
1644 error = xfs_iget(mp, NULL, mp->m_sb.sb_uquotino,
1645 0, 0, &uip);
1646 if (error)
1da177e4
LT
1647 return XFS_ERROR(error);
1648 }
92f8ff73 1649 if (XFS_IS_GQUOTA_ON(mp) &&
1da177e4
LT
1650 mp->m_sb.sb_gquotino != NULLFSINO) {
1651 ASSERT(mp->m_sb.sb_gquotino > 0);
113a5683
CS
1652 error = xfs_iget(mp, NULL, mp->m_sb.sb_gquotino,
1653 0, 0, &gip);
1654 if (error)
1655 goto error_rele;
1da177e4 1656 }
92f8ff73 1657 if (XFS_IS_PQUOTA_ON(mp) &&
d892d586
CS
1658 mp->m_sb.sb_pquotino != NULLFSINO) {
1659 ASSERT(mp->m_sb.sb_pquotino > 0);
1660 error = xfs_iget(mp, NULL, mp->m_sb.sb_pquotino,
92f8ff73
CS
1661 0, 0, &pip);
1662 if (error)
1663 goto error_rele;
1664 }
1da177e4
LT
1665 } else {
1666 flags |= XFS_QMOPT_SBVERSION;
1667 sbflags |= (XFS_SB_VERSIONNUM | XFS_SB_UQUOTINO |
d892d586
CS
1668 XFS_SB_GQUOTINO | XFS_SB_PQUOTINO |
1669 XFS_SB_QFLAGS);
1da177e4
LT
1670 }
1671
1672 /*
92f8ff73 1673 * Create the three inodes, if they don't exist already. The changes
1da177e4
LT
1674 * made above will get added to a transaction and logged in one of
1675 * the qino_alloc calls below. If the device is readonly,
1676 * temporarily switch to read-write to do this.
1677 */
1678 if (XFS_IS_UQUOTA_ON(mp) && uip == NULL) {
113a5683 1679 error = xfs_qm_qino_alloc(mp, &uip,
1da177e4 1680 sbflags | XFS_SB_UQUOTINO,
113a5683
CS
1681 flags | XFS_QMOPT_UQUOTA);
1682 if (error)
1683 goto error_rele;
1da177e4
LT
1684
1685 flags &= ~XFS_QMOPT_SBVERSION;
1686 }
92f8ff73 1687 if (XFS_IS_GQUOTA_ON(mp) && gip == NULL) {
c8ad20ff 1688 error = xfs_qm_qino_alloc(mp, &gip,
92f8ff73
CS
1689 sbflags | XFS_SB_GQUOTINO,
1690 flags | XFS_QMOPT_GQUOTA);
1691 if (error)
1692 goto error_rele;
1693
1694 flags &= ~XFS_QMOPT_SBVERSION;
1695 }
1696 if (XFS_IS_PQUOTA_ON(mp) && pip == NULL) {
92f8ff73 1697 error = xfs_qm_qino_alloc(mp, &pip,
d892d586 1698 sbflags | XFS_SB_PQUOTINO,
92f8ff73 1699 flags | XFS_QMOPT_PQUOTA);
113a5683
CS
1700 if (error)
1701 goto error_rele;
1da177e4
LT
1702 }
1703
8a7b8a89
CH
1704 mp->m_quotainfo->qi_uquotaip = uip;
1705 mp->m_quotainfo->qi_gquotaip = gip;
92f8ff73 1706 mp->m_quotainfo->qi_pquotaip = pip;
1da177e4 1707
014c2544 1708 return 0;
113a5683
CS
1709
1710error_rele:
1711 if (uip)
1712 IRELE(uip);
1713 if (gip)
1714 IRELE(gip);
92f8ff73
CS
1715 if (pip)
1716 IRELE(pip);
113a5683 1717 return XFS_ERROR(error);
1da177e4
LT
1718}
1719
92b2e5b3
CH
1720STATIC void
1721xfs_qm_dqfree_one(
1722 struct xfs_dquot *dqp)
1723{
1724 struct xfs_mount *mp = dqp->q_mount;
1725 struct xfs_quotainfo *qi = mp->m_quotainfo;
1da177e4 1726
9f920f11 1727 mutex_lock(&qi->qi_tree_lock);
329e0875 1728 radix_tree_delete(xfs_dquot_tree(qi, dqp->q_core.d_flags),
9f920f11 1729 be32_to_cpu(dqp->q_core.d_id));
368e1361 1730
92b2e5b3 1731 qi->qi_dquots--;
b84a3a96 1732 mutex_unlock(&qi->qi_tree_lock);
92b2e5b3
CH
1733
1734 xfs_qm_dqdestroy(dqp);
1735}
1736
1da177e4
LT
1737/*
1738 * Start a transaction and write the incore superblock changes to
1739 * disk. flags parameter indicates which fields have changed.
1740 */
1741int
1742xfs_qm_write_sb_changes(
1743 xfs_mount_t *mp,
1744 __int64_t flags)
1745{
1746 xfs_trans_t *tp;
1747 int error;
1748
1da177e4 1749 tp = xfs_trans_alloc(mp, XFS_TRANS_QM_SBCHANGE);
3d3c8b52 1750 error = xfs_trans_reserve(tp, &M_RES(mp)->tr_qm_sbchange, 0, 0);
f910a8c6 1751 if (error) {
1da177e4 1752 xfs_trans_cancel(tp, 0);
014c2544 1753 return error;
1da177e4
LT
1754 }
1755
1756 xfs_mod_sb(tp, flags);
e5720eec 1757 error = xfs_trans_commit(tp, 0);
1da177e4 1758
e5720eec 1759 return error;
1da177e4
LT
1760}
1761
1762
1763/* --------------- utility functions for vnodeops ---------------- */
1764
1765
1766/*
6c77b0ea 1767 * Given an inode, a uid, gid and prid make sure that we have
1da177e4
LT
1768 * allocated relevant dquot(s) on disk, and that we won't exceed inode
1769 * quotas by creating this file.
1770 * This also attaches dquot(s) to the given inode after locking it,
1771 * and returns the dquots corresponding to the uid and/or gid.
1772 *
1773 * in : inode (unlocked)
1774 * out : udquot, gdquot with references taken and unlocked
1775 */
1776int
1777xfs_qm_vop_dqalloc(
7d095257 1778 struct xfs_inode *ip,
7aab1b28
DE
1779 xfs_dqid_t uid,
1780 xfs_dqid_t gid,
7d095257
CH
1781 prid_t prid,
1782 uint flags,
1783 struct xfs_dquot **O_udqpp,
92f8ff73
CS
1784 struct xfs_dquot **O_gdqpp,
1785 struct xfs_dquot **O_pdqpp)
1da177e4 1786{
7d095257 1787 struct xfs_mount *mp = ip->i_mount;
113a5683
CS
1788 struct xfs_dquot *uq = NULL;
1789 struct xfs_dquot *gq = NULL;
92f8ff73 1790 struct xfs_dquot *pq = NULL;
7d095257
CH
1791 int error;
1792 uint lockflags;
1da177e4 1793
7d095257 1794 if (!XFS_IS_QUOTA_RUNNING(mp) || !XFS_IS_QUOTA_ON(mp))
1da177e4
LT
1795 return 0;
1796
1797 lockflags = XFS_ILOCK_EXCL;
1798 xfs_ilock(ip, lockflags);
1799
bd186aa9 1800 if ((flags & XFS_QMOPT_INHERIT) && XFS_INHERIT_GID(ip))
1da177e4
LT
1801 gid = ip->i_d.di_gid;
1802
1803 /*
1804 * Attach the dquot(s) to this inode, doing a dquot allocation
1805 * if necessary. The dquot(s) will not be locked.
1806 */
1807 if (XFS_NOT_DQATTACHED(mp, ip)) {
7d095257
CH
1808 error = xfs_qm_dqattach_locked(ip, XFS_QMOPT_DQALLOC);
1809 if (error) {
1da177e4 1810 xfs_iunlock(ip, lockflags);
014c2544 1811 return error;
1da177e4
LT
1812 }
1813 }
1814
c8ad20ff 1815 if ((flags & XFS_QMOPT_UQUOTA) && XFS_IS_UQUOTA_ON(mp)) {
1da177e4
LT
1816 if (ip->i_d.di_uid != uid) {
1817 /*
1818 * What we need is the dquot that has this uid, and
1819 * if we send the inode to dqget, the uid of the inode
1820 * takes priority over what's sent in the uid argument.
1821 * We must unlock inode here before calling dqget if
1822 * we're not sending the inode, because otherwise
1823 * we'll deadlock by doing trans_reserve while
1824 * holding ilock.
1825 */
1826 xfs_iunlock(ip, lockflags);
7aab1b28 1827 error = xfs_qm_dqget(mp, NULL, uid,
1da177e4
LT
1828 XFS_DQ_USER,
1829 XFS_QMOPT_DQALLOC |
1830 XFS_QMOPT_DOWARN,
113a5683
CS
1831 &uq);
1832 if (error) {
1da177e4 1833 ASSERT(error != ENOENT);
014c2544 1834 return error;
1da177e4
LT
1835 }
1836 /*
1837 * Get the ilock in the right order.
1838 */
1839 xfs_dqunlock(uq);
1840 lockflags = XFS_ILOCK_SHARED;
1841 xfs_ilock(ip, lockflags);
1842 } else {
1843 /*
1844 * Take an extra reference, because we'll return
1845 * this to caller
1846 */
1847 ASSERT(ip->i_udquot);
78e55892 1848 uq = xfs_qm_dqhold(ip->i_udquot);
1da177e4
LT
1849 }
1850 }
c8ad20ff 1851 if ((flags & XFS_QMOPT_GQUOTA) && XFS_IS_GQUOTA_ON(mp)) {
1da177e4
LT
1852 if (ip->i_d.di_gid != gid) {
1853 xfs_iunlock(ip, lockflags);
7aab1b28 1854 error = xfs_qm_dqget(mp, NULL, gid,
1da177e4
LT
1855 XFS_DQ_GROUP,
1856 XFS_QMOPT_DQALLOC |
1857 XFS_QMOPT_DOWARN,
113a5683
CS
1858 &gq);
1859 if (error) {
1da177e4 1860 ASSERT(error != ENOENT);
113a5683 1861 goto error_rele;
1da177e4
LT
1862 }
1863 xfs_dqunlock(gq);
1864 lockflags = XFS_ILOCK_SHARED;
1865 xfs_ilock(ip, lockflags);
1866 } else {
1867 ASSERT(ip->i_gdquot);
78e55892 1868 gq = xfs_qm_dqhold(ip->i_gdquot);
1da177e4 1869 }
92f8ff73
CS
1870 }
1871 if ((flags & XFS_QMOPT_PQUOTA) && XFS_IS_PQUOTA_ON(mp)) {
6743099c 1872 if (xfs_get_projid(ip) != prid) {
c8ad20ff 1873 xfs_iunlock(ip, lockflags);
113a5683 1874 error = xfs_qm_dqget(mp, NULL, (xfs_dqid_t)prid,
c8ad20ff
NS
1875 XFS_DQ_PROJ,
1876 XFS_QMOPT_DQALLOC |
1877 XFS_QMOPT_DOWARN,
92f8ff73 1878 &pq);
113a5683 1879 if (error) {
c8ad20ff 1880 ASSERT(error != ENOENT);
113a5683 1881 goto error_rele;
c8ad20ff 1882 }
92f8ff73 1883 xfs_dqunlock(pq);
c8ad20ff
NS
1884 lockflags = XFS_ILOCK_SHARED;
1885 xfs_ilock(ip, lockflags);
1886 } else {
92f8ff73
CS
1887 ASSERT(ip->i_pdquot);
1888 pq = xfs_qm_dqhold(ip->i_pdquot);
c8ad20ff 1889 }
1da177e4
LT
1890 }
1891 if (uq)
0b1b213f 1892 trace_xfs_dquot_dqalloc(ip);
1da177e4
LT
1893
1894 xfs_iunlock(ip, lockflags);
1895 if (O_udqpp)
1896 *O_udqpp = uq;
1897 else if (uq)
1898 xfs_qm_dqrele(uq);
1899 if (O_gdqpp)
1900 *O_gdqpp = gq;
1901 else if (gq)
1902 xfs_qm_dqrele(gq);
92f8ff73
CS
1903 if (O_pdqpp)
1904 *O_pdqpp = pq;
1905 else if (pq)
1906 xfs_qm_dqrele(pq);
014c2544 1907 return 0;
113a5683
CS
1908
1909error_rele:
92f8ff73
CS
1910 if (gq)
1911 xfs_qm_dqrele(gq);
113a5683
CS
1912 if (uq)
1913 xfs_qm_dqrele(uq);
1914 return error;
1da177e4
LT
1915}
1916
1917/*
1918 * Actually transfer ownership, and do dquot modifications.
1919 * These were already reserved.
1920 */
1921xfs_dquot_t *
1922xfs_qm_vop_chown(
1923 xfs_trans_t *tp,
1924 xfs_inode_t *ip,
1925 xfs_dquot_t **IO_olddq,
1926 xfs_dquot_t *newdq)
1927{
1928 xfs_dquot_t *prevdq;
06d10dd9
NS
1929 uint bfield = XFS_IS_REALTIME_INODE(ip) ?
1930 XFS_TRANS_DQ_RTBCOUNT : XFS_TRANS_DQ_BCOUNT;
1931
7d095257 1932
579aa9ca 1933 ASSERT(xfs_isilocked(ip, XFS_ILOCK_EXCL));
1da177e4
LT
1934 ASSERT(XFS_IS_QUOTA_RUNNING(ip->i_mount));
1935
1936 /* old dquot */
1937 prevdq = *IO_olddq;
1938 ASSERT(prevdq);
1939 ASSERT(prevdq != newdq);
1940
06d10dd9
NS
1941 xfs_trans_mod_dquot(tp, prevdq, bfield, -(ip->i_d.di_nblocks));
1942 xfs_trans_mod_dquot(tp, prevdq, XFS_TRANS_DQ_ICOUNT, -1);
1da177e4
LT
1943
1944 /* the sparkling new dquot */
06d10dd9
NS
1945 xfs_trans_mod_dquot(tp, newdq, bfield, ip->i_d.di_nblocks);
1946 xfs_trans_mod_dquot(tp, newdq, XFS_TRANS_DQ_ICOUNT, 1);
1da177e4
LT
1947
1948 /*
78e55892
CH
1949 * Take an extra reference, because the inode is going to keep
1950 * this dquot pointer even after the trans_commit.
1da177e4 1951 */
78e55892 1952 *IO_olddq = xfs_qm_dqhold(newdq);
1da177e4 1953
014c2544 1954 return prevdq;
1da177e4
LT
1955}
1956
1957/*
c8ad20ff 1958 * Quota reservations for setattr(AT_UID|AT_GID|AT_PROJID).
1da177e4
LT
1959 */
1960int
1961xfs_qm_vop_chown_reserve(
113a5683
CS
1962 struct xfs_trans *tp,
1963 struct xfs_inode *ip,
1964 struct xfs_dquot *udqp,
1965 struct xfs_dquot *gdqp,
92f8ff73 1966 struct xfs_dquot *pdqp,
113a5683 1967 uint flags)
1da177e4 1968{
113a5683
CS
1969 struct xfs_mount *mp = ip->i_mount;
1970 uint delblks, blkflags, prjflags = 0;
1971 struct xfs_dquot *udq_unres = NULL;
1972 struct xfs_dquot *gdq_unres = NULL;
92f8ff73 1973 struct xfs_dquot *pdq_unres = NULL;
113a5683
CS
1974 struct xfs_dquot *udq_delblks = NULL;
1975 struct xfs_dquot *gdq_delblks = NULL;
92f8ff73 1976 struct xfs_dquot *pdq_delblks = NULL;
113a5683 1977 int error;
7d095257 1978
1da177e4 1979
579aa9ca 1980 ASSERT(xfs_isilocked(ip, XFS_ILOCK_EXCL|XFS_ILOCK_SHARED));
1da177e4
LT
1981 ASSERT(XFS_IS_QUOTA_RUNNING(mp));
1982
1983 delblks = ip->i_delayed_blks;
06d10dd9
NS
1984 blkflags = XFS_IS_REALTIME_INODE(ip) ?
1985 XFS_QMOPT_RES_RTBLKS : XFS_QMOPT_RES_REGBLKS;
1da177e4
LT
1986
1987 if (XFS_IS_UQUOTA_ON(mp) && udqp &&
7aab1b28 1988 ip->i_d.di_uid != be32_to_cpu(udqp->q_core.d_id)) {
113a5683 1989 udq_delblks = udqp;
1da177e4
LT
1990 /*
1991 * If there are delayed allocation blocks, then we have to
1992 * unreserve those from the old dquot, and add them to the
1993 * new dquot.
1994 */
1995 if (delblks) {
1996 ASSERT(ip->i_udquot);
113a5683 1997 udq_unres = ip->i_udquot;
1da177e4
LT
1998 }
1999 }
92f8ff73
CS
2000 if (XFS_IS_GQUOTA_ON(ip->i_mount) && gdqp &&
2001 ip->i_d.di_gid != be32_to_cpu(gdqp->q_core.d_id)) {
2002 gdq_delblks = gdqp;
2003 if (delblks) {
2004 ASSERT(ip->i_gdquot);
2005 gdq_unres = ip->i_gdquot;
2006 }
2007 }
2008
2009 if (XFS_IS_PQUOTA_ON(ip->i_mount) && pdqp &&
2010 xfs_get_projid(ip) != be32_to_cpu(pdqp->q_core.d_id)) {
2011 prjflags = XFS_QMOPT_ENOSPC;
2012 pdq_delblks = pdqp;
2013 if (delblks) {
2014 ASSERT(ip->i_pdquot);
2015 pdq_unres = ip->i_pdquot;
1da177e4
LT
2016 }
2017 }
2018
113a5683 2019 error = xfs_trans_reserve_quota_bydquots(tp, ip->i_mount,
92f8ff73
CS
2020 udq_delblks, gdq_delblks, pdq_delblks,
2021 ip->i_d.di_nblocks, 1,
113a5683
CS
2022 flags | blkflags | prjflags);
2023 if (error)
2024 return error;
1da177e4
LT
2025
2026 /*
2027 * Do the delayed blks reservations/unreservations now. Since, these
2028 * are done without the help of a transaction, if a reservation fails
2029 * its previous reservations won't be automatically undone by trans
2030 * code. So, we have to do it manually here.
2031 */
2032 if (delblks) {
2033 /*
2034 * Do the reservations first. Unreservation can't fail.
2035 */
92f8ff73
CS
2036 ASSERT(udq_delblks || gdq_delblks || pdq_delblks);
2037 ASSERT(udq_unres || gdq_unres || pdq_unres);
113a5683 2038 error = xfs_trans_reserve_quota_bydquots(NULL, ip->i_mount,
92f8ff73
CS
2039 udq_delblks, gdq_delblks, pdq_delblks,
2040 (xfs_qcnt_t)delblks, 0,
113a5683
CS
2041 flags | blkflags | prjflags);
2042 if (error)
2043 return error;
1da177e4 2044 xfs_trans_reserve_quota_bydquots(NULL, ip->i_mount,
92f8ff73
CS
2045 udq_unres, gdq_unres, pdq_unres,
2046 -((xfs_qcnt_t)delblks), 0, blkflags);
1da177e4
LT
2047 }
2048
2049 return (0);
2050}
2051
2052int
2053xfs_qm_vop_rename_dqattach(
7d095257 2054 struct xfs_inode **i_tab)
1da177e4 2055{
7d095257
CH
2056 struct xfs_mount *mp = i_tab[0]->i_mount;
2057 int i;
1da177e4 2058
7d095257 2059 if (!XFS_IS_QUOTA_RUNNING(mp) || !XFS_IS_QUOTA_ON(mp))
014c2544 2060 return 0;
1da177e4 2061
7d095257
CH
2062 for (i = 0; (i < 4 && i_tab[i]); i++) {
2063 struct xfs_inode *ip = i_tab[i];
2064 int error;
2065
1da177e4
LT
2066 /*
2067 * Watch out for duplicate entries in the table.
2068 */
7d095257
CH
2069 if (i == 0 || ip != i_tab[i-1]) {
2070 if (XFS_NOT_DQATTACHED(mp, ip)) {
1da177e4
LT
2071 error = xfs_qm_dqattach(ip, 0);
2072 if (error)
014c2544 2073 return error;
1da177e4
LT
2074 }
2075 }
2076 }
014c2544 2077 return 0;
1da177e4
LT
2078}
2079
2080void
7d095257
CH
2081xfs_qm_vop_create_dqattach(
2082 struct xfs_trans *tp,
2083 struct xfs_inode *ip,
2084 struct xfs_dquot *udqp,
92f8ff73
CS
2085 struct xfs_dquot *gdqp,
2086 struct xfs_dquot *pdqp)
1da177e4 2087{
7d095257
CH
2088 struct xfs_mount *mp = tp->t_mountp;
2089
2090 if (!XFS_IS_QUOTA_RUNNING(mp) || !XFS_IS_QUOTA_ON(mp))
1da177e4
LT
2091 return;
2092
579aa9ca 2093 ASSERT(xfs_isilocked(ip, XFS_ILOCK_EXCL));
7d095257 2094 ASSERT(XFS_IS_QUOTA_RUNNING(mp));
1da177e4
LT
2095
2096 if (udqp) {
1da177e4 2097 ASSERT(ip->i_udquot == NULL);
7d095257 2098 ASSERT(XFS_IS_UQUOTA_ON(mp));
1149d96a 2099 ASSERT(ip->i_d.di_uid == be32_to_cpu(udqp->q_core.d_id));
78e55892
CH
2100
2101 ip->i_udquot = xfs_qm_dqhold(udqp);
1da177e4
LT
2102 xfs_trans_mod_dquot(tp, udqp, XFS_TRANS_DQ_ICOUNT, 1);
2103 }
2104 if (gdqp) {
1da177e4 2105 ASSERT(ip->i_gdquot == NULL);
92f8ff73
CS
2106 ASSERT(XFS_IS_GQUOTA_ON(mp));
2107 ASSERT(ip->i_d.di_gid == be32_to_cpu(gdqp->q_core.d_id));
78e55892 2108 ip->i_gdquot = xfs_qm_dqhold(gdqp);
1da177e4
LT
2109 xfs_trans_mod_dquot(tp, gdqp, XFS_TRANS_DQ_ICOUNT, 1);
2110 }
92f8ff73
CS
2111 if (pdqp) {
2112 ASSERT(ip->i_pdquot == NULL);
2113 ASSERT(XFS_IS_PQUOTA_ON(mp));
2114 ASSERT(xfs_get_projid(ip) == be32_to_cpu(pdqp->q_core.d_id));
2115
2116 ip->i_pdquot = xfs_qm_dqhold(pdqp);
2117 xfs_trans_mod_dquot(tp, pdqp, XFS_TRANS_DQ_ICOUNT, 1);
2118 }
1da177e4
LT
2119}
2120