xfs: split out EFI/EFD log item format definition
[linux-2.6-block.git] / fs / xfs / xfs_qm.c
CommitLineData
1da177e4 1/*
4ce3121f
NS
2 * Copyright (c) 2000-2005 Silicon Graphics, Inc.
3 * All Rights Reserved.
1da177e4 4 *
4ce3121f
NS
5 * This program is free software; you can redistribute it and/or
6 * modify it under the terms of the GNU General Public License as
1da177e4
LT
7 * published by the Free Software Foundation.
8 *
4ce3121f
NS
9 * This program is distributed in the hope that it would be useful,
10 * but WITHOUT ANY WARRANTY; without even the implied warranty of
11 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
12 * GNU General Public License for more details.
1da177e4 13 *
4ce3121f
NS
14 * You should have received a copy of the GNU General Public License
15 * along with this program; if not, write the Free Software Foundation,
16 * Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA
1da177e4 17 */
1da177e4
LT
18#include "xfs.h"
19#include "xfs_fs.h"
a844f451 20#include "xfs_bit.h"
1da177e4 21#include "xfs_log.h"
1da177e4
LT
22#include "xfs_trans.h"
23#include "xfs_sb.h"
24#include "xfs_ag.h"
1da177e4 25#include "xfs_alloc.h"
1da177e4
LT
26#include "xfs_quota.h"
27#include "xfs_mount.h"
1da177e4
LT
28#include "xfs_bmap_btree.h"
29#include "xfs_ialloc_btree.h"
1da177e4
LT
30#include "xfs_dinode.h"
31#include "xfs_inode.h"
a844f451
NS
32#include "xfs_ialloc.h"
33#include "xfs_itable.h"
1da177e4
LT
34#include "xfs_rtalloc.h"
35#include "xfs_error.h"
a844f451 36#include "xfs_bmap.h"
1da177e4
LT
37#include "xfs_attr.h"
38#include "xfs_buf_item.h"
39#include "xfs_trans_space.h"
40#include "xfs_utils.h"
1da177e4 41#include "xfs_qm.h"
0b1b213f 42#include "xfs_trace.h"
33479e05 43#include "xfs_icache.h"
6fcdc59d 44#include "xfs_cksum.h"
1da177e4
LT
45
46/*
47 * The global quota manager. There is only one of these for the entire
48 * system, _not_ one per file system. XQM keeps track of the overall
49 * quota functionality, including maintaining the freelist and hash
50 * tables of dquots.
51 */
1da177e4 52STATIC int xfs_qm_init_quotainos(xfs_mount_t *);
ba0f32d4 53STATIC int xfs_qm_init_quotainfo(xfs_mount_t *);
1495f230 54STATIC int xfs_qm_shake(struct shrinker *, struct shrink_control *);
1da177e4 55
b84a3a96
CH
56/*
57 * We use the batch lookup interface to iterate over the dquots as it
58 * currently is the only interface into the radix tree code that allows
59 * fuzzy lookups instead of exact matches. Holding the lock over multiple
60 * operations is fine as all callers are used either during mount/umount
61 * or quotaoff.
62 */
63#define XFS_DQ_LOOKUP_BATCH 32
64
65STATIC int
66xfs_qm_dquot_walk(
67 struct xfs_mount *mp,
68 int type,
43ff2122
CH
69 int (*execute)(struct xfs_dquot *dqp, void *data),
70 void *data)
b84a3a96
CH
71{
72 struct xfs_quotainfo *qi = mp->m_quotainfo;
329e0875 73 struct radix_tree_root *tree = xfs_dquot_tree(qi, type);
b84a3a96
CH
74 uint32_t next_index;
75 int last_error = 0;
76 int skipped;
77 int nr_found;
78
79restart:
80 skipped = 0;
81 next_index = 0;
82 nr_found = 0;
83
84 while (1) {
85 struct xfs_dquot *batch[XFS_DQ_LOOKUP_BATCH];
86 int error = 0;
87 int i;
88
89 mutex_lock(&qi->qi_tree_lock);
90 nr_found = radix_tree_gang_lookup(tree, (void **)batch,
91 next_index, XFS_DQ_LOOKUP_BATCH);
92 if (!nr_found) {
93 mutex_unlock(&qi->qi_tree_lock);
94 break;
95 }
96
97 for (i = 0; i < nr_found; i++) {
98 struct xfs_dquot *dqp = batch[i];
99
100 next_index = be32_to_cpu(dqp->q_core.d_id) + 1;
101
43ff2122 102 error = execute(batch[i], data);
b84a3a96
CH
103 if (error == EAGAIN) {
104 skipped++;
105 continue;
106 }
107 if (error && last_error != EFSCORRUPTED)
108 last_error = error;
109 }
110
111 mutex_unlock(&qi->qi_tree_lock);
112
113 /* bail out if the filesystem is corrupted. */
114 if (last_error == EFSCORRUPTED) {
115 skipped = 0;
116 break;
117 }
118 }
119
120 if (skipped) {
121 delay(1);
122 goto restart;
123 }
124
125 return last_error;
126}
127
128
129/*
130 * Purge a dquot from all tracking data structures and free it.
131 */
132STATIC int
133xfs_qm_dqpurge(
43ff2122
CH
134 struct xfs_dquot *dqp,
135 void *data)
b84a3a96
CH
136{
137 struct xfs_mount *mp = dqp->q_mount;
138 struct xfs_quotainfo *qi = mp->m_quotainfo;
139 struct xfs_dquot *gdqp = NULL;
92f8ff73 140 struct xfs_dquot *pdqp = NULL;
b84a3a96
CH
141
142 xfs_dqlock(dqp);
143 if ((dqp->dq_flags & XFS_DQ_FREEING) || dqp->q_nrefs != 0) {
144 xfs_dqunlock(dqp);
145 return EAGAIN;
146 }
147
148 /*
92f8ff73 149 * If this quota has a hint attached, prepare for releasing it now.
b84a3a96
CH
150 */
151 gdqp = dqp->q_gdquot;
152 if (gdqp) {
153 xfs_dqlock(gdqp);
154 dqp->q_gdquot = NULL;
155 }
156
92f8ff73
CS
157 pdqp = dqp->q_pdquot;
158 if (pdqp) {
159 xfs_dqlock(pdqp);
160 dqp->q_pdquot = NULL;
161 }
162
b84a3a96
CH
163 dqp->dq_flags |= XFS_DQ_FREEING;
164
43ff2122 165 xfs_dqflock(dqp);
b84a3a96
CH
166
167 /*
168 * If we are turning this type of quotas off, we don't care
169 * about the dirty metadata sitting in this dquot. OTOH, if
170 * we're unmounting, we do care, so we flush it and wait.
171 */
172 if (XFS_DQ_IS_DIRTY(dqp)) {
fe7257fd
CH
173 struct xfs_buf *bp = NULL;
174 int error;
b84a3a96
CH
175
176 /*
177 * We don't care about getting disk errors here. We need
178 * to purge this dquot anyway, so we go ahead regardless.
179 */
fe7257fd
CH
180 error = xfs_qm_dqflush(dqp, &bp);
181 if (error) {
b84a3a96
CH
182 xfs_warn(mp, "%s: dquot %p flush failed",
183 __func__, dqp);
fe7257fd
CH
184 } else {
185 error = xfs_bwrite(bp);
186 xfs_buf_relse(bp);
187 }
b84a3a96
CH
188 xfs_dqflock(dqp);
189 }
190
191 ASSERT(atomic_read(&dqp->q_pincount) == 0);
192 ASSERT(XFS_FORCED_SHUTDOWN(mp) ||
193 !(dqp->q_logitem.qli_item.li_flags & XFS_LI_IN_AIL));
194
195 xfs_dqfunlock(dqp);
196 xfs_dqunlock(dqp);
197
329e0875 198 radix_tree_delete(xfs_dquot_tree(qi, dqp->q_core.d_flags),
b84a3a96
CH
199 be32_to_cpu(dqp->q_core.d_id));
200 qi->qi_dquots--;
201
202 /*
203 * We move dquots to the freelist as soon as their reference count
204 * hits zero, so it really should be on the freelist here.
205 */
206 mutex_lock(&qi->qi_lru_lock);
207 ASSERT(!list_empty(&dqp->q_lru));
208 list_del_init(&dqp->q_lru);
209 qi->qi_lru_count--;
210 XFS_STATS_DEC(xs_qm_dquot_unused);
211 mutex_unlock(&qi->qi_lru_lock);
212
213 xfs_qm_dqdestroy(dqp);
214
215 if (gdqp)
216 xfs_qm_dqput(gdqp);
92f8ff73
CS
217 if (pdqp)
218 xfs_qm_dqput(pdqp);
b84a3a96
CH
219 return 0;
220}
221
222/*
223 * Purge the dquot cache.
224 */
225void
226xfs_qm_dqpurge_all(
227 struct xfs_mount *mp,
228 uint flags)
229{
230 if (flags & XFS_QMOPT_UQUOTA)
43ff2122 231 xfs_qm_dquot_walk(mp, XFS_DQ_USER, xfs_qm_dqpurge, NULL);
b84a3a96 232 if (flags & XFS_QMOPT_GQUOTA)
43ff2122 233 xfs_qm_dquot_walk(mp, XFS_DQ_GROUP, xfs_qm_dqpurge, NULL);
b84a3a96 234 if (flags & XFS_QMOPT_PQUOTA)
43ff2122 235 xfs_qm_dquot_walk(mp, XFS_DQ_PROJ, xfs_qm_dqpurge, NULL);
b84a3a96
CH
236}
237
1da177e4
LT
238/*
239 * Just destroy the quotainfo structure.
240 */
241void
7d095257
CH
242xfs_qm_unmount(
243 struct xfs_mount *mp)
1da177e4 244{
7d095257 245 if (mp->m_quotainfo) {
8112e9dc 246 xfs_qm_dqpurge_all(mp, XFS_QMOPT_QUOTALL);
1da177e4 247 xfs_qm_destroy_quotainfo(mp);
7d095257 248 }
1da177e4
LT
249}
250
251
252/*
253 * This is called from xfs_mountfs to start quotas and initialize all
254 * necessary data structures like quotainfo. This is also responsible for
255 * running a quotacheck as necessary. We are guaranteed that the superblock
256 * is consistently read in at this point.
53aa7915
DC
257 *
258 * If we fail here, the mount will continue with quota turned off. We don't
259 * need to inidicate success or failure at all.
1da177e4 260 */
53aa7915 261void
1da177e4 262xfs_qm_mount_quotas(
4249023a 263 xfs_mount_t *mp)
1da177e4 264{
1da177e4
LT
265 int error = 0;
266 uint sbf;
267
1da177e4
LT
268 /*
269 * If quotas on realtime volumes is not supported, we disable
270 * quotas immediately.
271 */
272 if (mp->m_sb.sb_rextents) {
0b932ccc 273 xfs_notice(mp, "Cannot turn on quotas for realtime filesystem");
1da177e4
LT
274 mp->m_qflags = 0;
275 goto write_changes;
276 }
277
1da177e4 278 ASSERT(XFS_IS_QUOTA_RUNNING(mp));
155ffd07 279
1da177e4
LT
280 /*
281 * Allocate the quotainfo structure inside the mount struct, and
282 * create quotainode(s), and change/rev superblock if necessary.
283 */
53aa7915
DC
284 error = xfs_qm_init_quotainfo(mp);
285 if (error) {
1da177e4
LT
286 /*
287 * We must turn off quotas.
288 */
289 ASSERT(mp->m_quotainfo == NULL);
290 mp->m_qflags = 0;
291 goto write_changes;
292 }
293 /*
294 * If any of the quotas are not consistent, do a quotacheck.
295 */
4249023a 296 if (XFS_QM_NEED_QUOTACHECK(mp)) {
53aa7915
DC
297 error = xfs_qm_quotacheck(mp);
298 if (error) {
299 /* Quotacheck failed and disabled quotas. */
300 return;
1da177e4 301 }
1da177e4 302 }
646d5bda
DD
303 /*
304 * If one type of quotas is off, then it will lose its
305 * quotachecked status, since we won't be doing accounting for
306 * that type anymore.
307 */
53aa7915 308 if (!XFS_IS_UQUOTA_ON(mp))
646d5bda 309 mp->m_qflags &= ~XFS_UQUOTA_CHKD;
83e782e1
CS
310 if (!XFS_IS_GQUOTA_ON(mp))
311 mp->m_qflags &= ~XFS_GQUOTA_CHKD;
312 if (!XFS_IS_PQUOTA_ON(mp))
313 mp->m_qflags &= ~XFS_PQUOTA_CHKD;
155ffd07 314
1da177e4
LT
315 write_changes:
316 /*
3685c2a1 317 * We actually don't have to acquire the m_sb_lock at all.
1da177e4
LT
318 * This can only be called from mount, and that's single threaded. XXX
319 */
3685c2a1 320 spin_lock(&mp->m_sb_lock);
1da177e4
LT
321 sbf = mp->m_sb.sb_qflags;
322 mp->m_sb.sb_qflags = mp->m_qflags & XFS_MOUNT_QUOTA_ALL;
3685c2a1 323 spin_unlock(&mp->m_sb_lock);
1da177e4
LT
324
325 if (sbf != (mp->m_qflags & XFS_MOUNT_QUOTA_ALL)) {
326 if (xfs_qm_write_sb_changes(mp, XFS_SB_QFLAGS)) {
327 /*
328 * We could only have been turning quotas off.
329 * We aren't in very good shape actually because
330 * the incore structures are convinced that quotas are
331 * off, but the on disk superblock doesn't know that !
332 */
333 ASSERT(!(XFS_IS_QUOTA_RUNNING(mp)));
53487786
DC
334 xfs_alert(mp, "%s: Superblock update failed!",
335 __func__);
1da177e4
LT
336 }
337 }
338
339 if (error) {
53487786 340 xfs_warn(mp, "Failed to initialize disk quotas.");
7d095257 341 return;
1da177e4 342 }
1da177e4
LT
343}
344
345/*
346 * Called from the vfsops layer.
347 */
e57481dc 348void
1da177e4
LT
349xfs_qm_unmount_quotas(
350 xfs_mount_t *mp)
351{
1da177e4
LT
352 /*
353 * Release the dquots that root inode, et al might be holding,
354 * before we flush quotas and blow away the quotainfo structure.
355 */
356 ASSERT(mp->m_rootip);
357 xfs_qm_dqdetach(mp->m_rootip);
358 if (mp->m_rbmip)
359 xfs_qm_dqdetach(mp->m_rbmip);
360 if (mp->m_rsumip)
361 xfs_qm_dqdetach(mp->m_rsumip);
362
363 /*
e57481dc 364 * Release the quota inodes.
1da177e4 365 */
1da177e4 366 if (mp->m_quotainfo) {
e57481dc
CH
367 if (mp->m_quotainfo->qi_uquotaip) {
368 IRELE(mp->m_quotainfo->qi_uquotaip);
369 mp->m_quotainfo->qi_uquotaip = NULL;
1da177e4 370 }
e57481dc
CH
371 if (mp->m_quotainfo->qi_gquotaip) {
372 IRELE(mp->m_quotainfo->qi_gquotaip);
373 mp->m_quotainfo->qi_gquotaip = NULL;
1da177e4 374 }
92f8ff73
CS
375 if (mp->m_quotainfo->qi_pquotaip) {
376 IRELE(mp->m_quotainfo->qi_pquotaip);
377 mp->m_quotainfo->qi_pquotaip = NULL;
378 }
1da177e4 379 }
1da177e4
LT
380}
381
1da177e4
LT
382STATIC int
383xfs_qm_dqattach_one(
384 xfs_inode_t *ip,
385 xfs_dqid_t id,
386 uint type,
387 uint doalloc,
1da177e4
LT
388 xfs_dquot_t *udqhint, /* hint */
389 xfs_dquot_t **IO_idqpp)
390{
391 xfs_dquot_t *dqp;
392 int error;
393
579aa9ca 394 ASSERT(xfs_isilocked(ip, XFS_ILOCK_EXCL));
1da177e4 395 error = 0;
8e9b6e7f 396
1da177e4
LT
397 /*
398 * See if we already have it in the inode itself. IO_idqpp is
399 * &i_udquot or &i_gdquot. This made the code look weird, but
400 * made the logic a lot simpler.
401 */
8e9b6e7f
CH
402 dqp = *IO_idqpp;
403 if (dqp) {
0b1b213f 404 trace_xfs_dqattach_found(dqp);
8e9b6e7f 405 return 0;
1da177e4
LT
406 }
407
408 /*
409 * udqhint is the i_udquot field in inode, and is non-NULL only
c8ad20ff 410 * when the type arg is group/project. Its purpose is to save a
1da177e4
LT
411 * lookup by dqid (xfs_qm_dqget) by caching a group dquot inside
412 * the user dquot.
413 */
8e9b6e7f
CH
414 if (udqhint) {
415 ASSERT(type == XFS_DQ_GROUP || type == XFS_DQ_PROJ);
1da177e4
LT
416 xfs_dqlock(udqhint);
417
8e9b6e7f
CH
418 /*
419 * No need to take dqlock to look at the id.
420 *
421 * The ID can't change until it gets reclaimed, and it won't
422 * be reclaimed as long as we have a ref from inode and we
423 * hold the ilock.
424 */
92f8ff73
CS
425 if (type == XFS_DQ_GROUP)
426 dqp = udqhint->q_gdquot;
427 else
428 dqp = udqhint->q_pdquot;
8e9b6e7f 429 if (dqp && be32_to_cpu(dqp->q_core.d_id) == id) {
8e9b6e7f 430 ASSERT(*IO_idqpp == NULL);
8e9b6e7f 431
78e55892 432 *IO_idqpp = xfs_qm_dqhold(dqp);
1da177e4 433 xfs_dqunlock(udqhint);
8e9b6e7f 434 return 0;
1da177e4 435 }
8e9b6e7f
CH
436
437 /*
438 * We can't hold a dquot lock when we call the dqget code.
439 * We'll deadlock in no time, because of (not conforming to)
440 * lock ordering - the inodelock comes before any dquot lock,
441 * and we may drop and reacquire the ilock in xfs_qm_dqget().
442 */
1da177e4 443 xfs_dqunlock(udqhint);
8e9b6e7f
CH
444 }
445
1da177e4
LT
446 /*
447 * Find the dquot from somewhere. This bumps the
448 * reference count of dquot and returns it locked.
449 * This can return ENOENT if dquot didn't exist on
450 * disk and we didn't ask it to allocate;
451 * ESRCH if quotas got turned off suddenly.
452 */
db3e74b5
MH
453 error = xfs_qm_dqget(ip->i_mount, ip, id, type,
454 doalloc | XFS_QMOPT_DOWARN, &dqp);
8e9b6e7f
CH
455 if (error)
456 return error;
1da177e4 457
0b1b213f 458 trace_xfs_dqattach_get(dqp);
8e9b6e7f 459
1da177e4
LT
460 /*
461 * dqget may have dropped and re-acquired the ilock, but it guarantees
462 * that the dquot returned is the one that should go in the inode.
463 */
464 *IO_idqpp = dqp;
8e9b6e7f
CH
465 xfs_dqunlock(dqp);
466 return 0;
1da177e4
LT
467}
468
469
470/*
92f8ff73
CS
471 * Given a udquot and group/project type, attach the group/project
472 * dquot pointer to the udquot as a hint for future lookups.
1da177e4
LT
473 */
474STATIC void
92f8ff73
CS
475xfs_qm_dqattach_hint(
476 struct xfs_inode *ip,
477 int type)
1da177e4 478{
92f8ff73
CS
479 struct xfs_dquot **dqhintp;
480 struct xfs_dquot *dqp;
481 struct xfs_dquot *udq = ip->i_udquot;
482
483 ASSERT(type == XFS_DQ_GROUP || type == XFS_DQ_PROJ);
1da177e4 484
8e9b6e7f 485 xfs_dqlock(udq);
1da177e4 486
92f8ff73
CS
487 if (type == XFS_DQ_GROUP) {
488 dqp = ip->i_gdquot;
489 dqhintp = &udq->q_gdquot;
490 } else {
491 dqp = ip->i_pdquot;
492 dqhintp = &udq->q_pdquot;
493 }
494
495 if (*dqhintp) {
496 struct xfs_dquot *tmp;
497
498 if (*dqhintp == dqp)
ab680bb7 499 goto done;
1da177e4 500
92f8ff73
CS
501 tmp = *dqhintp;
502 *dqhintp = NULL;
1da177e4 503 xfs_qm_dqrele(tmp);
1da177e4 504 }
8e9b6e7f 505
92f8ff73 506 *dqhintp = xfs_qm_dqhold(dqp);
ab680bb7 507done:
8e9b6e7f 508 xfs_dqunlock(udq);
1da177e4
LT
509}
510
b4d05e30
CH
511static bool
512xfs_qm_need_dqattach(
513 struct xfs_inode *ip)
514{
515 struct xfs_mount *mp = ip->i_mount;
516
517 if (!XFS_IS_QUOTA_RUNNING(mp))
518 return false;
519 if (!XFS_IS_QUOTA_ON(mp))
520 return false;
521 if (!XFS_NOT_DQATTACHED(mp, ip))
522 return false;
9cad19d2 523 if (xfs_is_quota_inode(&mp->m_sb, ip->i_ino))
b4d05e30
CH
524 return false;
525 return true;
526}
1da177e4
LT
527
528/*
c8ad20ff
NS
529 * Given a locked inode, attach dquot(s) to it, taking U/G/P-QUOTAON
530 * into account.
1da177e4 531 * If XFS_QMOPT_DQALLOC, the dquot(s) will be allocated if needed.
1da177e4
LT
532 * Inode may get unlocked and relocked in here, and the caller must deal with
533 * the consequences.
534 */
535int
7d095257 536xfs_qm_dqattach_locked(
1da177e4
LT
537 xfs_inode_t *ip,
538 uint flags)
539{
540 xfs_mount_t *mp = ip->i_mount;
541 uint nquotas = 0;
542 int error = 0;
543
b4d05e30 544 if (!xfs_qm_need_dqattach(ip))
014c2544 545 return 0;
1da177e4 546
7d095257 547 ASSERT(xfs_isilocked(ip, XFS_ILOCK_EXCL));
1da177e4
LT
548
549 if (XFS_IS_UQUOTA_ON(mp)) {
550 error = xfs_qm_dqattach_one(ip, ip->i_d.di_uid, XFS_DQ_USER,
551 flags & XFS_QMOPT_DQALLOC,
1da177e4
LT
552 NULL, &ip->i_udquot);
553 if (error)
554 goto done;
555 nquotas++;
556 }
579aa9ca
CH
557
558 ASSERT(xfs_isilocked(ip, XFS_ILOCK_EXCL));
92f8ff73
CS
559 if (XFS_IS_GQUOTA_ON(mp)) {
560 error = xfs_qm_dqattach_one(ip, ip->i_d.di_gid, XFS_DQ_GROUP,
1da177e4 561 flags & XFS_QMOPT_DQALLOC,
1da177e4
LT
562 ip->i_udquot, &ip->i_gdquot);
563 /*
564 * Don't worry about the udquot that we may have
565 * attached above. It'll get detached, if not already.
566 */
567 if (error)
568 goto done;
569 nquotas++;
570 }
571
92f8ff73
CS
572 ASSERT(xfs_isilocked(ip, XFS_ILOCK_EXCL));
573 if (XFS_IS_PQUOTA_ON(mp)) {
574 error = xfs_qm_dqattach_one(ip, xfs_get_projid(ip), XFS_DQ_PROJ,
575 flags & XFS_QMOPT_DQALLOC,
576 ip->i_udquot, &ip->i_pdquot);
577 /*
578 * Don't worry about the udquot that we may have
579 * attached above. It'll get detached, if not already.
580 */
581 if (error)
582 goto done;
583 nquotas++;
584 }
585
1da177e4 586 /*
92f8ff73 587 * Attach this group/project quota to the user quota as a hint.
1da177e4
LT
588 * This WON'T, in general, result in a thrash.
589 */
92f8ff73 590 if (nquotas > 1 && ip->i_udquot) {
579aa9ca 591 ASSERT(xfs_isilocked(ip, XFS_ILOCK_EXCL));
92f8ff73
CS
592 ASSERT(ip->i_gdquot || !XFS_IS_GQUOTA_ON(mp));
593 ASSERT(ip->i_pdquot || !XFS_IS_PQUOTA_ON(mp));
1da177e4
LT
594
595 /*
ab680bb7
CH
596 * We do not have i_udquot locked at this point, but this check
597 * is OK since we don't depend on the i_gdquot to be accurate
598 * 100% all the time. It is just a hint, and this will
599 * succeed in general.
1da177e4 600 */
ab680bb7 601 if (ip->i_udquot->q_gdquot != ip->i_gdquot)
92f8ff73
CS
602 xfs_qm_dqattach_hint(ip, XFS_DQ_GROUP);
603
604 if (ip->i_udquot->q_pdquot != ip->i_pdquot)
605 xfs_qm_dqattach_hint(ip, XFS_DQ_PROJ);
1da177e4
LT
606 }
607
7d095257 608 done:
ea15ab3c
CH
609#ifdef DEBUG
610 if (!error) {
1da177e4
LT
611 if (XFS_IS_UQUOTA_ON(mp))
612 ASSERT(ip->i_udquot);
92f8ff73 613 if (XFS_IS_GQUOTA_ON(mp))
1da177e4 614 ASSERT(ip->i_gdquot);
92f8ff73
CS
615 if (XFS_IS_PQUOTA_ON(mp))
616 ASSERT(ip->i_pdquot);
1da177e4 617 }
7d095257 618 ASSERT(xfs_isilocked(ip, XFS_ILOCK_EXCL));
1da177e4 619#endif
7d095257
CH
620 return error;
621}
1da177e4 622
7d095257
CH
623int
624xfs_qm_dqattach(
625 struct xfs_inode *ip,
626 uint flags)
627{
628 int error;
629
b4d05e30
CH
630 if (!xfs_qm_need_dqattach(ip))
631 return 0;
632
7d095257
CH
633 xfs_ilock(ip, XFS_ILOCK_EXCL);
634 error = xfs_qm_dqattach_locked(ip, flags);
635 xfs_iunlock(ip, XFS_ILOCK_EXCL);
1da177e4 636
014c2544 637 return error;
1da177e4
LT
638}
639
640/*
641 * Release dquots (and their references) if any.
642 * The inode should be locked EXCL except when this's called by
643 * xfs_ireclaim.
644 */
645void
646xfs_qm_dqdetach(
647 xfs_inode_t *ip)
648{
92f8ff73 649 if (!(ip->i_udquot || ip->i_gdquot || ip->i_pdquot))
1da177e4
LT
650 return;
651
0b1b213f
CH
652 trace_xfs_dquot_dqdetach(ip);
653
9cad19d2 654 ASSERT(!xfs_is_quota_inode(&ip->i_mount->m_sb, ip->i_ino));
1da177e4
LT
655 if (ip->i_udquot) {
656 xfs_qm_dqrele(ip->i_udquot);
657 ip->i_udquot = NULL;
658 }
659 if (ip->i_gdquot) {
660 xfs_qm_dqrele(ip->i_gdquot);
661 ip->i_gdquot = NULL;
662 }
92f8ff73
CS
663 if (ip->i_pdquot) {
664 xfs_qm_dqrele(ip->i_pdquot);
665 ip->i_pdquot = NULL;
666 }
1da177e4
LT
667}
668
3fe58f30
CH
669int
670xfs_qm_calc_dquots_per_chunk(
671 struct xfs_mount *mp,
672 unsigned int nbblks) /* basic block units */
673{
674 unsigned int ndquots;
675
676 ASSERT(nbblks > 0);
677 ndquots = BBTOB(nbblks);
678 do_div(ndquots, sizeof(xfs_dqblk_t));
679
680 return ndquots;
681}
682
1da177e4
LT
683/*
684 * This initializes all the quota information that's kept in the
685 * mount structure
686 */
ba0f32d4 687STATIC int
1da177e4
LT
688xfs_qm_init_quotainfo(
689 xfs_mount_t *mp)
690{
691 xfs_quotainfo_t *qinf;
692 int error;
693 xfs_dquot_t *dqp;
694
695 ASSERT(XFS_IS_QUOTA_RUNNING(mp));
696
1da177e4
LT
697 qinf = mp->m_quotainfo = kmem_zalloc(sizeof(xfs_quotainfo_t), KM_SLEEP);
698
699 /*
700 * See if quotainodes are setup, and if not, allocate them,
701 * and change the superblock accordingly.
702 */
703 if ((error = xfs_qm_init_quotainos(mp))) {
f0e2d93c 704 kmem_free(qinf);
1da177e4 705 mp->m_quotainfo = NULL;
014c2544 706 return error;
1da177e4
LT
707 }
708
9f920f11
CH
709 INIT_RADIX_TREE(&qinf->qi_uquota_tree, GFP_NOFS);
710 INIT_RADIX_TREE(&qinf->qi_gquota_tree, GFP_NOFS);
92f8ff73 711 INIT_RADIX_TREE(&qinf->qi_pquota_tree, GFP_NOFS);
9f920f11
CH
712 mutex_init(&qinf->qi_tree_lock);
713
f8739c3c
CH
714 INIT_LIST_HEAD(&qinf->qi_lru_list);
715 qinf->qi_lru_count = 0;
716 mutex_init(&qinf->qi_lru_lock);
717
1da177e4 718 /* mutex used to serialize quotaoffs */
794ee1ba 719 mutex_init(&qinf->qi_quotaofflock);
1da177e4
LT
720
721 /* Precalc some constants */
722 qinf->qi_dqchunklen = XFS_FSB_TO_BB(mp, XFS_DQUOT_CLUSTER_SIZE_FSB);
3fe58f30
CH
723 qinf->qi_dqperchunk = xfs_qm_calc_dquots_per_chunk(mp,
724 qinf->qi_dqchunklen);
1da177e4
LT
725
726 mp->m_qflags |= (mp->m_sb.sb_qflags & XFS_ALL_QUOTA_CHKD);
727
728 /*
729 * We try to get the limits from the superuser's limits fields.
730 * This is quite hacky, but it is standard quota practice.
7ae44407 731 *
1da177e4
LT
732 * We look at the USR dquot with id == 0 first, but if user quotas
733 * are not enabled we goto the GRP dquot with id == 0.
734 * We don't really care to keep separate default limits for user
735 * and group quotas, at least not at this point.
7ae44407
CH
736 *
737 * Since we may not have done a quotacheck by this point, just read
738 * the dquot without attaching it to any hashtables or lists.
1da177e4 739 */
7ae44407
CH
740 error = xfs_qm_dqread(mp, 0,
741 XFS_IS_UQUOTA_RUNNING(mp) ? XFS_DQ_USER :
742 (XFS_IS_GQUOTA_RUNNING(mp) ? XFS_DQ_GROUP :
743 XFS_DQ_PROJ),
744 XFS_QMOPT_DOWARN, &dqp);
745 if (!error) {
1da177e4
LT
746 xfs_disk_dquot_t *ddqp = &dqp->q_core;
747
748 /*
749 * The warnings and timers set the grace period given to
750 * a user or group before he or she can not perform any
751 * more writing. If it is zero, a default is used.
752 */
1149d96a
CH
753 qinf->qi_btimelimit = ddqp->d_btimer ?
754 be32_to_cpu(ddqp->d_btimer) : XFS_QM_BTIMELIMIT;
755 qinf->qi_itimelimit = ddqp->d_itimer ?
756 be32_to_cpu(ddqp->d_itimer) : XFS_QM_ITIMELIMIT;
757 qinf->qi_rtbtimelimit = ddqp->d_rtbtimer ?
758 be32_to_cpu(ddqp->d_rtbtimer) : XFS_QM_RTBTIMELIMIT;
759 qinf->qi_bwarnlimit = ddqp->d_bwarns ?
760 be16_to_cpu(ddqp->d_bwarns) : XFS_QM_BWARNLIMIT;
761 qinf->qi_iwarnlimit = ddqp->d_iwarns ?
762 be16_to_cpu(ddqp->d_iwarns) : XFS_QM_IWARNLIMIT;
763 qinf->qi_rtbwarnlimit = ddqp->d_rtbwarns ?
764 be16_to_cpu(ddqp->d_rtbwarns) : XFS_QM_RTBWARNLIMIT;
765 qinf->qi_bhardlimit = be64_to_cpu(ddqp->d_blk_hardlimit);
766 qinf->qi_bsoftlimit = be64_to_cpu(ddqp->d_blk_softlimit);
767 qinf->qi_ihardlimit = be64_to_cpu(ddqp->d_ino_hardlimit);
768 qinf->qi_isoftlimit = be64_to_cpu(ddqp->d_ino_softlimit);
769 qinf->qi_rtbhardlimit = be64_to_cpu(ddqp->d_rtb_hardlimit);
770 qinf->qi_rtbsoftlimit = be64_to_cpu(ddqp->d_rtb_softlimit);
1da177e4 771
1da177e4
LT
772 xfs_qm_dqdestroy(dqp);
773 } else {
774 qinf->qi_btimelimit = XFS_QM_BTIMELIMIT;
775 qinf->qi_itimelimit = XFS_QM_ITIMELIMIT;
776 qinf->qi_rtbtimelimit = XFS_QM_RTBTIMELIMIT;
777 qinf->qi_bwarnlimit = XFS_QM_BWARNLIMIT;
778 qinf->qi_iwarnlimit = XFS_QM_IWARNLIMIT;
06d10dd9 779 qinf->qi_rtbwarnlimit = XFS_QM_RTBWARNLIMIT;
1da177e4
LT
780 }
781
f8739c3c
CH
782 qinf->qi_shrinker.shrink = xfs_qm_shake;
783 qinf->qi_shrinker.seeks = DEFAULT_SEEKS;
784 register_shrinker(&qinf->qi_shrinker);
014c2544 785 return 0;
1da177e4
LT
786}
787
788
789/*
790 * Gets called when unmounting a filesystem or when all quotas get
791 * turned off.
792 * This purges the quota inodes, destroys locks and frees itself.
793 */
794void
795xfs_qm_destroy_quotainfo(
796 xfs_mount_t *mp)
797{
798 xfs_quotainfo_t *qi;
799
800 qi = mp->m_quotainfo;
801 ASSERT(qi != NULL);
1da177e4 802
f8739c3c
CH
803 unregister_shrinker(&qi->qi_shrinker);
804
1da177e4 805 if (qi->qi_uquotaip) {
26cc0021 806 IRELE(qi->qi_uquotaip);
1da177e4
LT
807 qi->qi_uquotaip = NULL; /* paranoia */
808 }
809 if (qi->qi_gquotaip) {
26cc0021 810 IRELE(qi->qi_gquotaip);
1da177e4
LT
811 qi->qi_gquotaip = NULL;
812 }
92f8ff73
CS
813 if (qi->qi_pquotaip) {
814 IRELE(qi->qi_pquotaip);
815 qi->qi_pquotaip = NULL;
816 }
1da177e4 817 mutex_destroy(&qi->qi_quotaofflock);
f0e2d93c 818 kmem_free(qi);
1da177e4
LT
819 mp->m_quotainfo = NULL;
820}
821
1da177e4
LT
822/*
823 * Create an inode and return with a reference already taken, but unlocked
824 * This is how we create quota inodes
825 */
826STATIC int
827xfs_qm_qino_alloc(
828 xfs_mount_t *mp,
829 xfs_inode_t **ip,
830 __int64_t sbfields,
831 uint flags)
832{
833 xfs_trans_t *tp;
834 int error;
1da177e4
LT
835 int committed;
836
d892d586
CS
837 *ip = NULL;
838 /*
839 * With superblock that doesn't have separate pquotino, we
840 * share an inode between gquota and pquota. If the on-disk
841 * superblock has GQUOTA and the filesystem is now mounted
842 * with PQUOTA, just use sb_gquotino for sb_pquotino and
843 * vice-versa.
844 */
845 if (!xfs_sb_version_has_pquotino(&mp->m_sb) &&
846 (flags & (XFS_QMOPT_PQUOTA|XFS_QMOPT_GQUOTA))) {
847 xfs_ino_t ino = NULLFSINO;
848
849 if ((flags & XFS_QMOPT_PQUOTA) &&
850 (mp->m_sb.sb_gquotino != NULLFSINO)) {
851 ino = mp->m_sb.sb_gquotino;
852 ASSERT(mp->m_sb.sb_pquotino == NULLFSINO);
853 } else if ((flags & XFS_QMOPT_GQUOTA) &&
854 (mp->m_sb.sb_pquotino != NULLFSINO)) {
855 ino = mp->m_sb.sb_pquotino;
856 ASSERT(mp->m_sb.sb_gquotino == NULLFSINO);
857 }
858 if (ino != NULLFSINO) {
859 error = xfs_iget(mp, NULL, ino, 0, 0, ip);
860 if (error)
861 return error;
862 mp->m_sb.sb_gquotino = NULLFSINO;
863 mp->m_sb.sb_pquotino = NULLFSINO;
864 }
865 }
866
061f7209 867 tp = xfs_trans_alloc(mp, XFS_TRANS_QM_QINOCREATE);
1da177e4
LT
868 if ((error = xfs_trans_reserve(tp,
869 XFS_QM_QINOCREATE_SPACE_RES(mp),
870 XFS_CREATE_LOG_RES(mp), 0,
871 XFS_TRANS_PERM_LOG_RES,
872 XFS_CREATE_LOG_COUNT))) {
873 xfs_trans_cancel(tp, 0);
014c2544 874 return error;
1da177e4 875 }
1da177e4 876
d892d586
CS
877 if (!*ip) {
878 error = xfs_dir_ialloc(&tp, NULL, S_IFREG, 1, 0, 0, 1, ip,
879 &committed);
880 if (error) {
881 xfs_trans_cancel(tp, XFS_TRANS_RELEASE_LOG_RES |
882 XFS_TRANS_ABORT);
883 return error;
884 }
1da177e4
LT
885 }
886
1da177e4
LT
887 /*
888 * Make the changes in the superblock, and log those too.
889 * sbfields arg may contain fields other than *QUOTINO;
890 * VERSIONNUM for example.
891 */
3685c2a1 892 spin_lock(&mp->m_sb_lock);
1da177e4 893 if (flags & XFS_QMOPT_SBVERSION) {
62118709 894 ASSERT(!xfs_sb_version_hasquota(&mp->m_sb));
1da177e4 895 ASSERT((sbfields & (XFS_SB_VERSIONNUM | XFS_SB_UQUOTINO |
d892d586
CS
896 XFS_SB_GQUOTINO | XFS_SB_PQUOTINO | XFS_SB_QFLAGS)) ==
897 (XFS_SB_VERSIONNUM | XFS_SB_UQUOTINO |
898 XFS_SB_GQUOTINO | XFS_SB_PQUOTINO |
899 XFS_SB_QFLAGS));
1da177e4 900
62118709 901 xfs_sb_version_addquota(&mp->m_sb);
1da177e4
LT
902 mp->m_sb.sb_uquotino = NULLFSINO;
903 mp->m_sb.sb_gquotino = NULLFSINO;
d892d586 904 mp->m_sb.sb_pquotino = NULLFSINO;
1da177e4 905
d892d586
CS
906 /* qflags will get updated fully _after_ quotacheck */
907 mp->m_sb.sb_qflags = mp->m_qflags & XFS_ALL_QUOTA_ACCT;
1da177e4
LT
908 }
909 if (flags & XFS_QMOPT_UQUOTA)
910 mp->m_sb.sb_uquotino = (*ip)->i_ino;
d892d586 911 else if (flags & XFS_QMOPT_GQUOTA)
1da177e4 912 mp->m_sb.sb_gquotino = (*ip)->i_ino;
d892d586
CS
913 else
914 mp->m_sb.sb_pquotino = (*ip)->i_ino;
3685c2a1 915 spin_unlock(&mp->m_sb_lock);
1da177e4
LT
916 xfs_mod_sb(tp, sbfields);
917
1c72bf90 918 if ((error = xfs_trans_commit(tp, XFS_TRANS_RELEASE_LOG_RES))) {
53487786 919 xfs_alert(mp, "%s failed (error %d)!", __func__, error);
014c2544 920 return error;
1da177e4 921 }
014c2544 922 return 0;
1da177e4
LT
923}
924
925
5b139738 926STATIC void
1da177e4
LT
927xfs_qm_reset_dqcounts(
928 xfs_mount_t *mp,
929 xfs_buf_t *bp,
930 xfs_dqid_t id,
931 uint type)
932{
6fcdc59d 933 struct xfs_dqblk *dqb;
1da177e4
LT
934 int j;
935
0b1b213f
CH
936 trace_xfs_reset_dqcounts(bp, _RET_IP_);
937
1da177e4
LT
938 /*
939 * Reset all counters and timers. They'll be
940 * started afresh by xfs_qm_quotacheck.
941 */
942#ifdef DEBUG
943 j = XFS_FSB_TO_B(mp, XFS_DQUOT_CLUSTER_SIZE_FSB);
944 do_div(j, sizeof(xfs_dqblk_t));
8a7b8a89 945 ASSERT(mp->m_quotainfo->qi_dqperchunk == j);
1da177e4 946#endif
6fcdc59d 947 dqb = bp->b_addr;
8a7b8a89 948 for (j = 0; j < mp->m_quotainfo->qi_dqperchunk; j++) {
6fcdc59d
DC
949 struct xfs_disk_dquot *ddq;
950
951 ddq = (struct xfs_disk_dquot *)&dqb[j];
952
1da177e4
LT
953 /*
954 * Do a sanity check, and if needed, repair the dqblk. Don't
955 * output any warnings because it's perfectly possible to
c41564b5 956 * find uninitialised dquot blks. See comment in xfs_qm_dqcheck.
1da177e4 957 */
a0fa2b67 958 (void) xfs_qm_dqcheck(mp, ddq, id+j, type, XFS_QMOPT_DQREPAIR,
1da177e4 959 "xfs_quotacheck");
1149d96a
CH
960 ddq->d_bcount = 0;
961 ddq->d_icount = 0;
962 ddq->d_rtbcount = 0;
963 ddq->d_btimer = 0;
964 ddq->d_itimer = 0;
965 ddq->d_rtbtimer = 0;
966 ddq->d_bwarns = 0;
967 ddq->d_iwarns = 0;
968 ddq->d_rtbwarns = 0;
6fcdc59d
DC
969
970 if (xfs_sb_version_hascrc(&mp->m_sb)) {
971 xfs_update_cksum((char *)&dqb[j],
972 sizeof(struct xfs_dqblk),
973 XFS_DQUOT_CRC_OFF);
974 }
1da177e4 975 }
1da177e4
LT
976}
977
978STATIC int
979xfs_qm_dqiter_bufs(
43ff2122
CH
980 struct xfs_mount *mp,
981 xfs_dqid_t firstid,
982 xfs_fsblock_t bno,
983 xfs_filblks_t blkcnt,
984 uint flags,
985 struct list_head *buffer_list)
1da177e4 986{
43ff2122
CH
987 struct xfs_buf *bp;
988 int error;
989 int type;
1da177e4
LT
990
991 ASSERT(blkcnt > 0);
c8ad20ff
NS
992 type = flags & XFS_QMOPT_UQUOTA ? XFS_DQ_USER :
993 (flags & XFS_QMOPT_PQUOTA ? XFS_DQ_PROJ : XFS_DQ_GROUP);
1da177e4
LT
994 error = 0;
995
996 /*
997 * Blkcnt arg can be a very big number, and might even be
998 * larger than the log itself. So, we have to break it up into
999 * manageable-sized transactions.
1000 * Note that we don't start a permanent transaction here; we might
1001 * not be able to get a log reservation for the whole thing up front,
1002 * and we don't really care to either, because we just discard
1003 * everything if we were to crash in the middle of this loop.
1004 */
1005 while (blkcnt--) {
1006 error = xfs_trans_read_buf(mp, NULL, mp->m_ddev_targp,
1007 XFS_FSB_TO_DADDR(mp, bno),
c6319198 1008 mp->m_quotainfo->qi_dqchunklen, 0, &bp,
1813dd64 1009 &xfs_dquot_buf_ops);
1da177e4 1010
3fe58f30 1011 /*
6fcdc59d
DC
1012 * CRC and validation errors will return a EFSCORRUPTED here. If
1013 * this occurs, re-read without CRC validation so that we can
1014 * repair the damage via xfs_qm_reset_dqcounts(). This process
1015 * will leave a trace in the log indicating corruption has
1016 * been detected.
3fe58f30 1017 */
6fcdc59d
DC
1018 if (error == EFSCORRUPTED) {
1019 error = xfs_trans_read_buf(mp, NULL, mp->m_ddev_targp,
1020 XFS_FSB_TO_DADDR(mp, bno),
1021 mp->m_quotainfo->qi_dqchunklen, 0, &bp,
1022 NULL);
1023 }
1024
1025 if (error)
1026 break;
1027
5b139738 1028 xfs_qm_reset_dqcounts(mp, bp, firstid, type);
43ff2122 1029 xfs_buf_delwri_queue(bp, buffer_list);
61551f1e 1030 xfs_buf_relse(bp);
6fcdc59d
DC
1031
1032 /* goto the next block. */
1da177e4 1033 bno++;
8a7b8a89 1034 firstid += mp->m_quotainfo->qi_dqperchunk;
1da177e4 1035 }
43ff2122 1036
014c2544 1037 return error;
1da177e4
LT
1038}
1039
1040/*
c8ad20ff 1041 * Iterate over all allocated USR/GRP/PRJ dquots in the system, calling a
1da177e4
LT
1042 * caller supplied function for every chunk of dquots that we find.
1043 */
1044STATIC int
1045xfs_qm_dqiterate(
43ff2122
CH
1046 struct xfs_mount *mp,
1047 struct xfs_inode *qip,
1048 uint flags,
1049 struct list_head *buffer_list)
1da177e4 1050{
43ff2122 1051 struct xfs_bmbt_irec *map;
1da177e4
LT
1052 int i, nmaps; /* number of map entries */
1053 int error; /* return value */
1054 xfs_fileoff_t lblkno;
1055 xfs_filblks_t maxlblkcnt;
1056 xfs_dqid_t firstid;
1057 xfs_fsblock_t rablkno;
1058 xfs_filblks_t rablkcnt;
1059
1060 error = 0;
1061 /*
c41564b5 1062 * This looks racy, but we can't keep an inode lock across a
1da177e4
LT
1063 * trans_reserve. But, this gets called during quotacheck, and that
1064 * happens only at mount time which is single threaded.
1065 */
1066 if (qip->i_d.di_nblocks == 0)
014c2544 1067 return 0;
1da177e4
LT
1068
1069 map = kmem_alloc(XFS_DQITER_MAP_SIZE * sizeof(*map), KM_SLEEP);
1070
1071 lblkno = 0;
32972383 1072 maxlblkcnt = XFS_B_TO_FSB(mp, mp->m_super->s_maxbytes);
1da177e4
LT
1073 do {
1074 nmaps = XFS_DQITER_MAP_SIZE;
1075 /*
1076 * We aren't changing the inode itself. Just changing
1077 * some of its data. No new blocks are added here, and
1078 * the inode is never added to the transaction.
1079 */
1080 xfs_ilock(qip, XFS_ILOCK_SHARED);
5c8ed202
DC
1081 error = xfs_bmapi_read(qip, lblkno, maxlblkcnt - lblkno,
1082 map, &nmaps, 0);
1da177e4
LT
1083 xfs_iunlock(qip, XFS_ILOCK_SHARED);
1084 if (error)
1085 break;
1086
1087 ASSERT(nmaps <= XFS_DQITER_MAP_SIZE);
1088 for (i = 0; i < nmaps; i++) {
1089 ASSERT(map[i].br_startblock != DELAYSTARTBLOCK);
1090 ASSERT(map[i].br_blockcount);
1091
1092
1093 lblkno += map[i].br_blockcount;
1094
1095 if (map[i].br_startblock == HOLESTARTBLOCK)
1096 continue;
1097
1098 firstid = (xfs_dqid_t) map[i].br_startoff *
8a7b8a89 1099 mp->m_quotainfo->qi_dqperchunk;
1da177e4
LT
1100 /*
1101 * Do a read-ahead on the next extent.
1102 */
1103 if ((i+1 < nmaps) &&
1104 (map[i+1].br_startblock != HOLESTARTBLOCK)) {
1105 rablkcnt = map[i+1].br_blockcount;
1106 rablkno = map[i+1].br_startblock;
1107 while (rablkcnt--) {
1a1a3e97 1108 xfs_buf_readahead(mp->m_ddev_targp,
1da177e4 1109 XFS_FSB_TO_DADDR(mp, rablkno),
c3f8fc73
DC
1110 mp->m_quotainfo->qi_dqchunklen,
1111 NULL);
1da177e4
LT
1112 rablkno++;
1113 }
1114 }
1115 /*
1116 * Iterate thru all the blks in the extent and
1117 * reset the counters of all the dquots inside them.
1118 */
43ff2122
CH
1119 error = xfs_qm_dqiter_bufs(mp, firstid,
1120 map[i].br_startblock,
1121 map[i].br_blockcount,
1122 flags, buffer_list);
1123 if (error)
1124 goto out;
1da177e4 1125 }
1da177e4
LT
1126 } while (nmaps > 0);
1127
43ff2122 1128out:
f0e2d93c 1129 kmem_free(map);
014c2544 1130 return error;
1da177e4
LT
1131}
1132
1133/*
1134 * Called by dqusage_adjust in doing a quotacheck.
52fda114
CH
1135 *
1136 * Given the inode, and a dquot id this updates both the incore dqout as well
1137 * as the buffer copy. This is so that once the quotacheck is done, we can
1138 * just log all the buffers, as opposed to logging numerous updates to
1139 * individual dquots.
1da177e4 1140 */
52fda114 1141STATIC int
1da177e4 1142xfs_qm_quotacheck_dqadjust(
52fda114
CH
1143 struct xfs_inode *ip,
1144 xfs_dqid_t id,
1145 uint type,
1da177e4
LT
1146 xfs_qcnt_t nblks,
1147 xfs_qcnt_t rtblks)
1148{
52fda114
CH
1149 struct xfs_mount *mp = ip->i_mount;
1150 struct xfs_dquot *dqp;
1151 int error;
1152
1153 error = xfs_qm_dqget(mp, ip, id, type,
1154 XFS_QMOPT_DQALLOC | XFS_QMOPT_DOWARN, &dqp);
1155 if (error) {
1156 /*
1157 * Shouldn't be able to turn off quotas here.
1158 */
1159 ASSERT(error != ESRCH);
1160 ASSERT(error != ENOENT);
1161 return error;
1162 }
0b1b213f
CH
1163
1164 trace_xfs_dqadjust(dqp);
1165
1da177e4
LT
1166 /*
1167 * Adjust the inode count and the block count to reflect this inode's
1168 * resource usage.
1169 */
413d57c9 1170 be64_add_cpu(&dqp->q_core.d_icount, 1);
1da177e4
LT
1171 dqp->q_res_icount++;
1172 if (nblks) {
413d57c9 1173 be64_add_cpu(&dqp->q_core.d_bcount, nblks);
1da177e4
LT
1174 dqp->q_res_bcount += nblks;
1175 }
1176 if (rtblks) {
413d57c9 1177 be64_add_cpu(&dqp->q_core.d_rtbcount, rtblks);
1da177e4
LT
1178 dqp->q_res_rtbcount += rtblks;
1179 }
1180
1181 /*
1182 * Set default limits, adjust timers (since we changed usages)
191f8488
CH
1183 *
1184 * There are no timers for the default values set in the root dquot.
1da177e4 1185 */
191f8488 1186 if (dqp->q_core.d_id) {
4b6eae2e 1187 xfs_qm_adjust_dqlimits(mp, dqp);
52fda114 1188 xfs_qm_adjust_dqtimers(mp, &dqp->q_core);
1da177e4
LT
1189 }
1190
1191 dqp->dq_flags |= XFS_DQ_DIRTY;
52fda114
CH
1192 xfs_qm_dqput(dqp);
1193 return 0;
1da177e4
LT
1194}
1195
1196STATIC int
1197xfs_qm_get_rtblks(
1198 xfs_inode_t *ip,
1199 xfs_qcnt_t *O_rtblks)
1200{
1201 xfs_filblks_t rtblks; /* total rt blks */
4eea22f0 1202 xfs_extnum_t idx; /* extent record index */
1da177e4
LT
1203 xfs_ifork_t *ifp; /* inode fork pointer */
1204 xfs_extnum_t nextents; /* number of extent entries */
1da177e4
LT
1205 int error;
1206
1207 ASSERT(XFS_IS_REALTIME_INODE(ip));
1208 ifp = XFS_IFORK_PTR(ip, XFS_DATA_FORK);
1209 if (!(ifp->if_flags & XFS_IFEXTENTS)) {
1210 if ((error = xfs_iread_extents(NULL, ip, XFS_DATA_FORK)))
014c2544 1211 return error;
1da177e4
LT
1212 }
1213 rtblks = 0;
4eea22f0 1214 nextents = ifp->if_bytes / (uint)sizeof(xfs_bmbt_rec_t);
a6f64d4a
CH
1215 for (idx = 0; idx < nextents; idx++)
1216 rtblks += xfs_bmbt_get_blockcount(xfs_iext_get_ext(ifp, idx));
1da177e4 1217 *O_rtblks = (xfs_qcnt_t)rtblks;
014c2544 1218 return 0;
1da177e4
LT
1219}
1220
1221/*
1222 * callback routine supplied to bulkstat(). Given an inumber, find its
1223 * dquots and update them to account for resources taken by that inode.
1224 */
1225/* ARGSUSED */
1226STATIC int
1227xfs_qm_dqusage_adjust(
1228 xfs_mount_t *mp, /* mount point for filesystem */
1229 xfs_ino_t ino, /* inode number to get data for */
1230 void __user *buffer, /* not used */
1231 int ubsize, /* not used */
1da177e4 1232 int *ubused, /* not used */
1da177e4
LT
1233 int *res) /* result code value */
1234{
1235 xfs_inode_t *ip;
52fda114 1236 xfs_qcnt_t nblks, rtblks = 0;
1da177e4
LT
1237 int error;
1238
1239 ASSERT(XFS_IS_QUOTA_RUNNING(mp));
1240
1241 /*
1242 * rootino must have its resources accounted for, not so with the quota
1243 * inodes.
1244 */
9cad19d2 1245 if (xfs_is_quota_inode(&mp->m_sb, ino)) {
1da177e4
LT
1246 *res = BULKSTAT_RV_NOTHING;
1247 return XFS_ERROR(EINVAL);
1248 }
1249
1250 /*
1251 * We don't _need_ to take the ilock EXCL. However, the xfs_qm_dqget
1252 * interface expects the inode to be exclusively locked because that's
1253 * the case in all other instances. It's OK that we do this because
1254 * quotacheck is done only at mount time.
1255 */
52fda114
CH
1256 error = xfs_iget(mp, NULL, ino, 0, XFS_ILOCK_EXCL, &ip);
1257 if (error) {
1da177e4 1258 *res = BULKSTAT_RV_NOTHING;
014c2544 1259 return error;
1da177e4
LT
1260 }
1261
52fda114 1262 ASSERT(ip->i_delayed_blks == 0);
1da177e4 1263
52fda114 1264 if (XFS_IS_REALTIME_INODE(ip)) {
1da177e4
LT
1265 /*
1266 * Walk thru the extent list and count the realtime blocks.
1267 */
52fda114
CH
1268 error = xfs_qm_get_rtblks(ip, &rtblks);
1269 if (error)
1270 goto error0;
1da177e4 1271 }
1da177e4 1272
52fda114 1273 nblks = (xfs_qcnt_t)ip->i_d.di_nblocks - rtblks;
1da177e4
LT
1274
1275 /*
1276 * Add the (disk blocks and inode) resources occupied by this
1277 * inode to its dquots. We do this adjustment in the incore dquot,
1278 * and also copy the changes to its buffer.
1279 * We don't care about putting these changes in a transaction
1280 * envelope because if we crash in the middle of a 'quotacheck'
1281 * we have to start from the beginning anyway.
1282 * Once we're done, we'll log all the dquot bufs.
1283 *
c41564b5 1284 * The *QUOTA_ON checks below may look pretty racy, but quotachecks
1da177e4
LT
1285 * and quotaoffs don't race. (Quotachecks happen at mount time only).
1286 */
1287 if (XFS_IS_UQUOTA_ON(mp)) {
52fda114
CH
1288 error = xfs_qm_quotacheck_dqadjust(ip, ip->i_d.di_uid,
1289 XFS_DQ_USER, nblks, rtblks);
1290 if (error)
1291 goto error0;
1da177e4 1292 }
52fda114
CH
1293
1294 if (XFS_IS_GQUOTA_ON(mp)) {
1295 error = xfs_qm_quotacheck_dqadjust(ip, ip->i_d.di_gid,
1296 XFS_DQ_GROUP, nblks, rtblks);
1297 if (error)
1298 goto error0;
1da177e4 1299 }
1da177e4 1300
52fda114 1301 if (XFS_IS_PQUOTA_ON(mp)) {
6743099c 1302 error = xfs_qm_quotacheck_dqadjust(ip, xfs_get_projid(ip),
52fda114
CH
1303 XFS_DQ_PROJ, nblks, rtblks);
1304 if (error)
1305 goto error0;
1306 }
1307
1308 xfs_iunlock(ip, XFS_ILOCK_EXCL);
1309 IRELE(ip);
1da177e4 1310 *res = BULKSTAT_RV_DIDONE;
014c2544 1311 return 0;
52fda114
CH
1312
1313error0:
1314 xfs_iunlock(ip, XFS_ILOCK_EXCL);
1315 IRELE(ip);
1316 *res = BULKSTAT_RV_GIVEUP;
1317 return error;
1da177e4
LT
1318}
1319
b84a3a96
CH
1320STATIC int
1321xfs_qm_flush_one(
43ff2122
CH
1322 struct xfs_dquot *dqp,
1323 void *data)
b84a3a96 1324{
43ff2122 1325 struct list_head *buffer_list = data;
fe7257fd 1326 struct xfs_buf *bp = NULL;
b84a3a96
CH
1327 int error = 0;
1328
1329 xfs_dqlock(dqp);
1330 if (dqp->dq_flags & XFS_DQ_FREEING)
1331 goto out_unlock;
1332 if (!XFS_DQ_IS_DIRTY(dqp))
1333 goto out_unlock;
1334
43ff2122 1335 xfs_dqflock(dqp);
fe7257fd
CH
1336 error = xfs_qm_dqflush(dqp, &bp);
1337 if (error)
1338 goto out_unlock;
b84a3a96 1339
43ff2122 1340 xfs_buf_delwri_queue(bp, buffer_list);
fe7257fd 1341 xfs_buf_relse(bp);
b84a3a96
CH
1342out_unlock:
1343 xfs_dqunlock(dqp);
1344 return error;
1345}
1346
1da177e4
LT
1347/*
1348 * Walk thru all the filesystem inodes and construct a consistent view
1349 * of the disk quota world. If the quotacheck fails, disable quotas.
1350 */
1351int
1352xfs_qm_quotacheck(
1353 xfs_mount_t *mp)
1354{
113a5683
CS
1355 int done, count, error, error2;
1356 xfs_ino_t lastino;
1357 size_t structsz;
1358 uint flags;
1359 LIST_HEAD (buffer_list);
1360 struct xfs_inode *uip = mp->m_quotainfo->qi_uquotaip;
1361 struct xfs_inode *gip = mp->m_quotainfo->qi_gquotaip;
92f8ff73 1362 struct xfs_inode *pip = mp->m_quotainfo->qi_pquotaip;
1da177e4
LT
1363
1364 count = INT_MAX;
1365 structsz = 1;
1366 lastino = 0;
1367 flags = 0;
1368
92f8ff73 1369 ASSERT(uip || gip || pip);
1da177e4
LT
1370 ASSERT(XFS_IS_QUOTA_RUNNING(mp));
1371
0b932ccc 1372 xfs_notice(mp, "Quotacheck needed: Please wait.");
1da177e4
LT
1373
1374 /*
c8ad20ff 1375 * First we go thru all the dquots on disk, USR and GRP/PRJ, and reset
1da177e4
LT
1376 * their counters to zero. We need a clean slate.
1377 * We don't log our changes till later.
1378 */
8a7b8a89 1379 if (uip) {
43ff2122
CH
1380 error = xfs_qm_dqiterate(mp, uip, XFS_QMOPT_UQUOTA,
1381 &buffer_list);
8a7b8a89 1382 if (error)
1da177e4
LT
1383 goto error_return;
1384 flags |= XFS_UQUOTA_CHKD;
1385 }
1386
8a7b8a89 1387 if (gip) {
92f8ff73 1388 error = xfs_qm_dqiterate(mp, gip, XFS_QMOPT_GQUOTA,
43ff2122 1389 &buffer_list);
8a7b8a89 1390 if (error)
1da177e4 1391 goto error_return;
92f8ff73
CS
1392 flags |= XFS_GQUOTA_CHKD;
1393 }
1394
1395 if (pip) {
1396 error = xfs_qm_dqiterate(mp, pip, XFS_QMOPT_PQUOTA,
1397 &buffer_list);
1398 if (error)
1399 goto error_return;
1400 flags |= XFS_PQUOTA_CHKD;
1da177e4
LT
1401 }
1402
1403 do {
1404 /*
1405 * Iterate thru all the inodes in the file system,
1406 * adjusting the corresponding dquot counters in core.
1407 */
7dce11db
CH
1408 error = xfs_bulkstat(mp, &lastino, &count,
1409 xfs_qm_dqusage_adjust,
1410 structsz, NULL, &done);
1411 if (error)
1da177e4
LT
1412 break;
1413
7dce11db 1414 } while (!done);
1da177e4 1415
4b8879df 1416 /*
b84a3a96
CH
1417 * We've made all the changes that we need to make incore. Flush them
1418 * down to disk buffers if everything was updated successfully.
4b8879df 1419 */
43ff2122
CH
1420 if (XFS_IS_UQUOTA_ON(mp)) {
1421 error = xfs_qm_dquot_walk(mp, XFS_DQ_USER, xfs_qm_flush_one,
1422 &buffer_list);
1423 }
b84a3a96 1424 if (XFS_IS_GQUOTA_ON(mp)) {
43ff2122
CH
1425 error2 = xfs_qm_dquot_walk(mp, XFS_DQ_GROUP, xfs_qm_flush_one,
1426 &buffer_list);
b84a3a96
CH
1427 if (!error)
1428 error = error2;
1429 }
1430 if (XFS_IS_PQUOTA_ON(mp)) {
43ff2122
CH
1431 error2 = xfs_qm_dquot_walk(mp, XFS_DQ_PROJ, xfs_qm_flush_one,
1432 &buffer_list);
b84a3a96
CH
1433 if (!error)
1434 error = error2;
1435 }
4b8879df 1436
43ff2122
CH
1437 error2 = xfs_buf_delwri_submit(&buffer_list);
1438 if (!error)
1439 error = error2;
1440
1da177e4
LT
1441 /*
1442 * We can get this error if we couldn't do a dquot allocation inside
1443 * xfs_qm_dqusage_adjust (via bulkstat). We don't care about the
1444 * dirty dquots that might be cached, we just want to get rid of them
1445 * and turn quotaoff. The dquots won't be attached to any of the inodes
1446 * at this point (because we intentionally didn't in dqget_noattach).
1447 */
1448 if (error) {
8112e9dc 1449 xfs_qm_dqpurge_all(mp, XFS_QMOPT_QUOTALL);
1da177e4
LT
1450 goto error_return;
1451 }
1da177e4 1452
1da177e4
LT
1453 /*
1454 * If one type of quotas is off, then it will lose its
1455 * quotachecked status, since we won't be doing accounting for
1456 * that type anymore.
1457 */
4177af3a 1458 mp->m_qflags &= ~XFS_ALL_QUOTA_CHKD;
1da177e4
LT
1459 mp->m_qflags |= flags;
1460
1da177e4 1461 error_return:
43ff2122
CH
1462 while (!list_empty(&buffer_list)) {
1463 struct xfs_buf *bp =
1464 list_first_entry(&buffer_list, struct xfs_buf, b_list);
1465 list_del_init(&bp->b_list);
1466 xfs_buf_relse(bp);
1467 }
1468
1da177e4 1469 if (error) {
0b932ccc
DC
1470 xfs_warn(mp,
1471 "Quotacheck: Unsuccessful (Error %d): Disabling quotas.",
1472 error);
1da177e4
LT
1473 /*
1474 * We must turn off quotas.
1475 */
1476 ASSERT(mp->m_quotainfo != NULL);
1da177e4 1477 xfs_qm_destroy_quotainfo(mp);
31d5577b 1478 if (xfs_mount_reset_sbqflags(mp)) {
0b932ccc
DC
1479 xfs_warn(mp,
1480 "Quotacheck: Failed to reset quota flags.");
31d5577b 1481 }
0b932ccc
DC
1482 } else
1483 xfs_notice(mp, "Quotacheck: Done.");
1da177e4
LT
1484 return (error);
1485}
1486
1487/*
1488 * This is called after the superblock has been read in and we're ready to
1489 * iget the quota inodes.
1490 */
1491STATIC int
1492xfs_qm_init_quotainos(
1493 xfs_mount_t *mp)
1494{
113a5683
CS
1495 struct xfs_inode *uip = NULL;
1496 struct xfs_inode *gip = NULL;
92f8ff73 1497 struct xfs_inode *pip = NULL;
113a5683
CS
1498 int error;
1499 __int64_t sbflags = 0;
1500 uint flags = 0;
1da177e4
LT
1501
1502 ASSERT(mp->m_quotainfo);
1da177e4
LT
1503
1504 /*
1505 * Get the uquota and gquota inodes
1506 */
62118709 1507 if (xfs_sb_version_hasquota(&mp->m_sb)) {
1da177e4
LT
1508 if (XFS_IS_UQUOTA_ON(mp) &&
1509 mp->m_sb.sb_uquotino != NULLFSINO) {
1510 ASSERT(mp->m_sb.sb_uquotino > 0);
113a5683
CS
1511 error = xfs_iget(mp, NULL, mp->m_sb.sb_uquotino,
1512 0, 0, &uip);
1513 if (error)
1da177e4
LT
1514 return XFS_ERROR(error);
1515 }
92f8ff73 1516 if (XFS_IS_GQUOTA_ON(mp) &&
1da177e4
LT
1517 mp->m_sb.sb_gquotino != NULLFSINO) {
1518 ASSERT(mp->m_sb.sb_gquotino > 0);
113a5683
CS
1519 error = xfs_iget(mp, NULL, mp->m_sb.sb_gquotino,
1520 0, 0, &gip);
1521 if (error)
1522 goto error_rele;
1da177e4 1523 }
92f8ff73 1524 if (XFS_IS_PQUOTA_ON(mp) &&
d892d586
CS
1525 mp->m_sb.sb_pquotino != NULLFSINO) {
1526 ASSERT(mp->m_sb.sb_pquotino > 0);
1527 error = xfs_iget(mp, NULL, mp->m_sb.sb_pquotino,
92f8ff73
CS
1528 0, 0, &pip);
1529 if (error)
1530 goto error_rele;
1531 }
1da177e4
LT
1532 } else {
1533 flags |= XFS_QMOPT_SBVERSION;
1534 sbflags |= (XFS_SB_VERSIONNUM | XFS_SB_UQUOTINO |
d892d586
CS
1535 XFS_SB_GQUOTINO | XFS_SB_PQUOTINO |
1536 XFS_SB_QFLAGS);
1da177e4
LT
1537 }
1538
1539 /*
92f8ff73 1540 * Create the three inodes, if they don't exist already. The changes
1da177e4
LT
1541 * made above will get added to a transaction and logged in one of
1542 * the qino_alloc calls below. If the device is readonly,
1543 * temporarily switch to read-write to do this.
1544 */
1545 if (XFS_IS_UQUOTA_ON(mp) && uip == NULL) {
113a5683 1546 error = xfs_qm_qino_alloc(mp, &uip,
1da177e4 1547 sbflags | XFS_SB_UQUOTINO,
113a5683
CS
1548 flags | XFS_QMOPT_UQUOTA);
1549 if (error)
1550 goto error_rele;
1da177e4
LT
1551
1552 flags &= ~XFS_QMOPT_SBVERSION;
1553 }
92f8ff73 1554 if (XFS_IS_GQUOTA_ON(mp) && gip == NULL) {
c8ad20ff 1555 error = xfs_qm_qino_alloc(mp, &gip,
92f8ff73
CS
1556 sbflags | XFS_SB_GQUOTINO,
1557 flags | XFS_QMOPT_GQUOTA);
1558 if (error)
1559 goto error_rele;
1560
1561 flags &= ~XFS_QMOPT_SBVERSION;
1562 }
1563 if (XFS_IS_PQUOTA_ON(mp) && pip == NULL) {
92f8ff73 1564 error = xfs_qm_qino_alloc(mp, &pip,
d892d586 1565 sbflags | XFS_SB_PQUOTINO,
92f8ff73 1566 flags | XFS_QMOPT_PQUOTA);
113a5683
CS
1567 if (error)
1568 goto error_rele;
1da177e4
LT
1569 }
1570
8a7b8a89
CH
1571 mp->m_quotainfo->qi_uquotaip = uip;
1572 mp->m_quotainfo->qi_gquotaip = gip;
92f8ff73 1573 mp->m_quotainfo->qi_pquotaip = pip;
1da177e4 1574
014c2544 1575 return 0;
113a5683
CS
1576
1577error_rele:
1578 if (uip)
1579 IRELE(uip);
1580 if (gip)
1581 IRELE(gip);
92f8ff73
CS
1582 if (pip)
1583 IRELE(pip);
113a5683 1584 return XFS_ERROR(error);
1da177e4
LT
1585}
1586
92b2e5b3
CH
1587STATIC void
1588xfs_qm_dqfree_one(
1589 struct xfs_dquot *dqp)
1590{
1591 struct xfs_mount *mp = dqp->q_mount;
1592 struct xfs_quotainfo *qi = mp->m_quotainfo;
1da177e4 1593
9f920f11 1594 mutex_lock(&qi->qi_tree_lock);
329e0875 1595 radix_tree_delete(xfs_dquot_tree(qi, dqp->q_core.d_flags),
9f920f11 1596 be32_to_cpu(dqp->q_core.d_id));
368e1361 1597
92b2e5b3 1598 qi->qi_dquots--;
b84a3a96 1599 mutex_unlock(&qi->qi_tree_lock);
92b2e5b3
CH
1600
1601 xfs_qm_dqdestroy(dqp);
1602}
1603
1604STATIC void
1605xfs_qm_dqreclaim_one(
1606 struct xfs_dquot *dqp,
43ff2122 1607 struct list_head *buffer_list,
92b2e5b3 1608 struct list_head *dispose_list)
1da177e4 1609{
92b2e5b3 1610 struct xfs_mount *mp = dqp->q_mount;
f8739c3c 1611 struct xfs_quotainfo *qi = mp->m_quotainfo;
92b2e5b3 1612 int error;
1da177e4 1613
92b2e5b3 1614 if (!xfs_dqlock_nowait(dqp))
b870553c 1615 goto out_move_tail;
bf72de31 1616
92b2e5b3
CH
1617 /*
1618 * This dquot has acquired a reference in the meantime remove it from
1619 * the freelist and try again.
1620 */
1621 if (dqp->q_nrefs) {
1622 xfs_dqunlock(dqp);
1da177e4 1623
92b2e5b3 1624 trace_xfs_dqreclaim_want(dqp);
48776fd2 1625 XFS_STATS_INC(xs_qm_dqwants);
1da177e4 1626
f8739c3c
CH
1627 list_del_init(&dqp->q_lru);
1628 qi->qi_lru_count--;
48776fd2 1629 XFS_STATS_DEC(xs_qm_dquot_unused);
92b2e5b3
CH
1630 return;
1631 }
368e1361 1632
92b2e5b3
CH
1633 /*
1634 * Try to grab the flush lock. If this dquot is in the process of
1635 * getting flushed to disk, we don't want to reclaim it.
1636 */
1637 if (!xfs_dqflock_nowait(dqp))
b870553c 1638 goto out_unlock_move_tail;
0b1b213f 1639
92b2e5b3 1640 if (XFS_DQ_IS_DIRTY(dqp)) {
fe7257fd
CH
1641 struct xfs_buf *bp = NULL;
1642
92b2e5b3 1643 trace_xfs_dqreclaim_dirty(dqp);
0b1b213f 1644
fe7257fd 1645 error = xfs_qm_dqflush(dqp, &bp);
92b2e5b3
CH
1646 if (error) {
1647 xfs_warn(mp, "%s: dquot %p flush failed",
1648 __func__, dqp);
b870553c 1649 goto out_unlock_move_tail;
1da177e4 1650 }
368e1361 1651
43ff2122 1652 xfs_buf_delwri_queue(bp, buffer_list);
fe7257fd 1653 xfs_buf_relse(bp);
1da177e4 1654 /*
92b2e5b3
CH
1655 * Give the dquot another try on the freelist, as the
1656 * flushing will take some time.
1da177e4 1657 */
b870553c 1658 goto out_unlock_move_tail;
92b2e5b3
CH
1659 }
1660 xfs_dqfunlock(dqp);
92678554 1661
92b2e5b3
CH
1662 /*
1663 * Prevent lookups now that we are past the point of no return.
1664 */
1665 dqp->dq_flags |= XFS_DQ_FREEING;
1666 xfs_dqunlock(dqp);
92678554 1667
92b2e5b3 1668 ASSERT(dqp->q_nrefs == 0);
f8739c3c
CH
1669 list_move_tail(&dqp->q_lru, dispose_list);
1670 qi->qi_lru_count--;
48776fd2 1671 XFS_STATS_DEC(xs_qm_dquot_unused);
92678554 1672
92b2e5b3 1673 trace_xfs_dqreclaim_done(dqp);
48776fd2 1674 XFS_STATS_INC(xs_qm_dqreclaims);
92b2e5b3 1675 return;
1da177e4 1676
92b2e5b3
CH
1677 /*
1678 * Move the dquot to the tail of the list so that we don't spin on it.
1679 */
b870553c
DC
1680out_unlock_move_tail:
1681 xfs_dqunlock(dqp);
1682out_move_tail:
f8739c3c 1683 list_move_tail(&dqp->q_lru, &qi->qi_lru_list);
92b2e5b3 1684 trace_xfs_dqreclaim_busy(dqp);
48776fd2 1685 XFS_STATS_INC(xs_qm_dqreclaim_misses);
368e1361 1686}
1da177e4 1687
1da177e4 1688STATIC int
7f8275d0 1689xfs_qm_shake(
92b2e5b3
CH
1690 struct shrinker *shrink,
1691 struct shrink_control *sc)
1da177e4 1692{
f8739c3c
CH
1693 struct xfs_quotainfo *qi =
1694 container_of(shrink, struct xfs_quotainfo, qi_shrinker);
92b2e5b3 1695 int nr_to_scan = sc->nr_to_scan;
43ff2122 1696 LIST_HEAD (buffer_list);
92b2e5b3
CH
1697 LIST_HEAD (dispose_list);
1698 struct xfs_dquot *dqp;
43ff2122 1699 int error;
1da177e4 1700
92b2e5b3 1701 if ((sc->gfp_mask & (__GFP_FS|__GFP_WAIT)) != (__GFP_FS|__GFP_WAIT))
014c2544 1702 return 0;
92b2e5b3
CH
1703 if (!nr_to_scan)
1704 goto out;
1da177e4 1705
f8739c3c
CH
1706 mutex_lock(&qi->qi_lru_lock);
1707 while (!list_empty(&qi->qi_lru_list)) {
92b2e5b3
CH
1708 if (nr_to_scan-- <= 0)
1709 break;
f8739c3c
CH
1710 dqp = list_first_entry(&qi->qi_lru_list, struct xfs_dquot,
1711 q_lru);
43ff2122 1712 xfs_qm_dqreclaim_one(dqp, &buffer_list, &dispose_list);
1da177e4 1713 }
f8739c3c 1714 mutex_unlock(&qi->qi_lru_lock);
1da177e4 1715
43ff2122
CH
1716 error = xfs_buf_delwri_submit(&buffer_list);
1717 if (error)
1718 xfs_warn(NULL, "%s: dquot reclaim failed", __func__);
1719
92b2e5b3 1720 while (!list_empty(&dispose_list)) {
f8739c3c
CH
1721 dqp = list_first_entry(&dispose_list, struct xfs_dquot, q_lru);
1722 list_del_init(&dqp->q_lru);
92b2e5b3
CH
1723 xfs_qm_dqfree_one(dqp);
1724 }
43ff2122 1725
92b2e5b3 1726out:
f8739c3c 1727 return (qi->qi_lru_count / 100) * sysctl_vfs_cache_pressure;
1da177e4
LT
1728}
1729
1da177e4
LT
1730/*
1731 * Start a transaction and write the incore superblock changes to
1732 * disk. flags parameter indicates which fields have changed.
1733 */
1734int
1735xfs_qm_write_sb_changes(
1736 xfs_mount_t *mp,
1737 __int64_t flags)
1738{
1739 xfs_trans_t *tp;
1740 int error;
1741
1da177e4 1742 tp = xfs_trans_alloc(mp, XFS_TRANS_QM_SBCHANGE);
f910a8c6
JL
1743 error = xfs_trans_reserve(tp, 0, XFS_QM_SBCHANGE_LOG_RES(mp),
1744 0, 0, XFS_DEFAULT_LOG_COUNT);
1745 if (error) {
1da177e4 1746 xfs_trans_cancel(tp, 0);
014c2544 1747 return error;
1da177e4
LT
1748 }
1749
1750 xfs_mod_sb(tp, flags);
e5720eec 1751 error = xfs_trans_commit(tp, 0);
1da177e4 1752
e5720eec 1753 return error;
1da177e4
LT
1754}
1755
1756
1757/* --------------- utility functions for vnodeops ---------------- */
1758
1759
1760/*
6c77b0ea 1761 * Given an inode, a uid, gid and prid make sure that we have
1da177e4
LT
1762 * allocated relevant dquot(s) on disk, and that we won't exceed inode
1763 * quotas by creating this file.
1764 * This also attaches dquot(s) to the given inode after locking it,
1765 * and returns the dquots corresponding to the uid and/or gid.
1766 *
1767 * in : inode (unlocked)
1768 * out : udquot, gdquot with references taken and unlocked
1769 */
1770int
1771xfs_qm_vop_dqalloc(
7d095257
CH
1772 struct xfs_inode *ip,
1773 uid_t uid,
1774 gid_t gid,
1775 prid_t prid,
1776 uint flags,
1777 struct xfs_dquot **O_udqpp,
92f8ff73
CS
1778 struct xfs_dquot **O_gdqpp,
1779 struct xfs_dquot **O_pdqpp)
1da177e4 1780{
7d095257 1781 struct xfs_mount *mp = ip->i_mount;
113a5683
CS
1782 struct xfs_dquot *uq = NULL;
1783 struct xfs_dquot *gq = NULL;
92f8ff73 1784 struct xfs_dquot *pq = NULL;
7d095257
CH
1785 int error;
1786 uint lockflags;
1da177e4 1787
7d095257 1788 if (!XFS_IS_QUOTA_RUNNING(mp) || !XFS_IS_QUOTA_ON(mp))
1da177e4
LT
1789 return 0;
1790
1791 lockflags = XFS_ILOCK_EXCL;
1792 xfs_ilock(ip, lockflags);
1793
bd186aa9 1794 if ((flags & XFS_QMOPT_INHERIT) && XFS_INHERIT_GID(ip))
1da177e4
LT
1795 gid = ip->i_d.di_gid;
1796
1797 /*
1798 * Attach the dquot(s) to this inode, doing a dquot allocation
1799 * if necessary. The dquot(s) will not be locked.
1800 */
1801 if (XFS_NOT_DQATTACHED(mp, ip)) {
7d095257
CH
1802 error = xfs_qm_dqattach_locked(ip, XFS_QMOPT_DQALLOC);
1803 if (error) {
1da177e4 1804 xfs_iunlock(ip, lockflags);
014c2544 1805 return error;
1da177e4
LT
1806 }
1807 }
1808
c8ad20ff 1809 if ((flags & XFS_QMOPT_UQUOTA) && XFS_IS_UQUOTA_ON(mp)) {
1da177e4
LT
1810 if (ip->i_d.di_uid != uid) {
1811 /*
1812 * What we need is the dquot that has this uid, and
1813 * if we send the inode to dqget, the uid of the inode
1814 * takes priority over what's sent in the uid argument.
1815 * We must unlock inode here before calling dqget if
1816 * we're not sending the inode, because otherwise
1817 * we'll deadlock by doing trans_reserve while
1818 * holding ilock.
1819 */
1820 xfs_iunlock(ip, lockflags);
113a5683 1821 error = xfs_qm_dqget(mp, NULL, (xfs_dqid_t) uid,
1da177e4
LT
1822 XFS_DQ_USER,
1823 XFS_QMOPT_DQALLOC |
1824 XFS_QMOPT_DOWARN,
113a5683
CS
1825 &uq);
1826 if (error) {
1da177e4 1827 ASSERT(error != ENOENT);
014c2544 1828 return error;
1da177e4
LT
1829 }
1830 /*
1831 * Get the ilock in the right order.
1832 */
1833 xfs_dqunlock(uq);
1834 lockflags = XFS_ILOCK_SHARED;
1835 xfs_ilock(ip, lockflags);
1836 } else {
1837 /*
1838 * Take an extra reference, because we'll return
1839 * this to caller
1840 */
1841 ASSERT(ip->i_udquot);
78e55892 1842 uq = xfs_qm_dqhold(ip->i_udquot);
1da177e4
LT
1843 }
1844 }
c8ad20ff 1845 if ((flags & XFS_QMOPT_GQUOTA) && XFS_IS_GQUOTA_ON(mp)) {
1da177e4
LT
1846 if (ip->i_d.di_gid != gid) {
1847 xfs_iunlock(ip, lockflags);
113a5683 1848 error = xfs_qm_dqget(mp, NULL, (xfs_dqid_t)gid,
1da177e4
LT
1849 XFS_DQ_GROUP,
1850 XFS_QMOPT_DQALLOC |
1851 XFS_QMOPT_DOWARN,
113a5683
CS
1852 &gq);
1853 if (error) {
1da177e4 1854 ASSERT(error != ENOENT);
113a5683 1855 goto error_rele;
1da177e4
LT
1856 }
1857 xfs_dqunlock(gq);
1858 lockflags = XFS_ILOCK_SHARED;
1859 xfs_ilock(ip, lockflags);
1860 } else {
1861 ASSERT(ip->i_gdquot);
78e55892 1862 gq = xfs_qm_dqhold(ip->i_gdquot);
1da177e4 1863 }
92f8ff73
CS
1864 }
1865 if ((flags & XFS_QMOPT_PQUOTA) && XFS_IS_PQUOTA_ON(mp)) {
6743099c 1866 if (xfs_get_projid(ip) != prid) {
c8ad20ff 1867 xfs_iunlock(ip, lockflags);
113a5683 1868 error = xfs_qm_dqget(mp, NULL, (xfs_dqid_t)prid,
c8ad20ff
NS
1869 XFS_DQ_PROJ,
1870 XFS_QMOPT_DQALLOC |
1871 XFS_QMOPT_DOWARN,
92f8ff73 1872 &pq);
113a5683 1873 if (error) {
c8ad20ff 1874 ASSERT(error != ENOENT);
113a5683 1875 goto error_rele;
c8ad20ff 1876 }
92f8ff73 1877 xfs_dqunlock(pq);
c8ad20ff
NS
1878 lockflags = XFS_ILOCK_SHARED;
1879 xfs_ilock(ip, lockflags);
1880 } else {
92f8ff73
CS
1881 ASSERT(ip->i_pdquot);
1882 pq = xfs_qm_dqhold(ip->i_pdquot);
c8ad20ff 1883 }
1da177e4
LT
1884 }
1885 if (uq)
0b1b213f 1886 trace_xfs_dquot_dqalloc(ip);
1da177e4
LT
1887
1888 xfs_iunlock(ip, lockflags);
1889 if (O_udqpp)
1890 *O_udqpp = uq;
1891 else if (uq)
1892 xfs_qm_dqrele(uq);
1893 if (O_gdqpp)
1894 *O_gdqpp = gq;
1895 else if (gq)
1896 xfs_qm_dqrele(gq);
92f8ff73
CS
1897 if (O_pdqpp)
1898 *O_pdqpp = pq;
1899 else if (pq)
1900 xfs_qm_dqrele(pq);
014c2544 1901 return 0;
113a5683
CS
1902
1903error_rele:
92f8ff73
CS
1904 if (gq)
1905 xfs_qm_dqrele(gq);
113a5683
CS
1906 if (uq)
1907 xfs_qm_dqrele(uq);
1908 return error;
1da177e4
LT
1909}
1910
1911/*
1912 * Actually transfer ownership, and do dquot modifications.
1913 * These were already reserved.
1914 */
1915xfs_dquot_t *
1916xfs_qm_vop_chown(
1917 xfs_trans_t *tp,
1918 xfs_inode_t *ip,
1919 xfs_dquot_t **IO_olddq,
1920 xfs_dquot_t *newdq)
1921{
1922 xfs_dquot_t *prevdq;
06d10dd9
NS
1923 uint bfield = XFS_IS_REALTIME_INODE(ip) ?
1924 XFS_TRANS_DQ_RTBCOUNT : XFS_TRANS_DQ_BCOUNT;
1925
7d095257 1926
579aa9ca 1927 ASSERT(xfs_isilocked(ip, XFS_ILOCK_EXCL));
1da177e4
LT
1928 ASSERT(XFS_IS_QUOTA_RUNNING(ip->i_mount));
1929
1930 /* old dquot */
1931 prevdq = *IO_olddq;
1932 ASSERT(prevdq);
1933 ASSERT(prevdq != newdq);
1934
06d10dd9
NS
1935 xfs_trans_mod_dquot(tp, prevdq, bfield, -(ip->i_d.di_nblocks));
1936 xfs_trans_mod_dquot(tp, prevdq, XFS_TRANS_DQ_ICOUNT, -1);
1da177e4
LT
1937
1938 /* the sparkling new dquot */
06d10dd9
NS
1939 xfs_trans_mod_dquot(tp, newdq, bfield, ip->i_d.di_nblocks);
1940 xfs_trans_mod_dquot(tp, newdq, XFS_TRANS_DQ_ICOUNT, 1);
1da177e4
LT
1941
1942 /*
78e55892
CH
1943 * Take an extra reference, because the inode is going to keep
1944 * this dquot pointer even after the trans_commit.
1da177e4 1945 */
78e55892 1946 *IO_olddq = xfs_qm_dqhold(newdq);
1da177e4 1947
014c2544 1948 return prevdq;
1da177e4
LT
1949}
1950
1951/*
c8ad20ff 1952 * Quota reservations for setattr(AT_UID|AT_GID|AT_PROJID).
1da177e4
LT
1953 */
1954int
1955xfs_qm_vop_chown_reserve(
113a5683
CS
1956 struct xfs_trans *tp,
1957 struct xfs_inode *ip,
1958 struct xfs_dquot *udqp,
1959 struct xfs_dquot *gdqp,
92f8ff73 1960 struct xfs_dquot *pdqp,
113a5683 1961 uint flags)
1da177e4 1962{
113a5683
CS
1963 struct xfs_mount *mp = ip->i_mount;
1964 uint delblks, blkflags, prjflags = 0;
1965 struct xfs_dquot *udq_unres = NULL;
1966 struct xfs_dquot *gdq_unres = NULL;
92f8ff73 1967 struct xfs_dquot *pdq_unres = NULL;
113a5683
CS
1968 struct xfs_dquot *udq_delblks = NULL;
1969 struct xfs_dquot *gdq_delblks = NULL;
92f8ff73 1970 struct xfs_dquot *pdq_delblks = NULL;
113a5683 1971 int error;
7d095257 1972
1da177e4 1973
579aa9ca 1974 ASSERT(xfs_isilocked(ip, XFS_ILOCK_EXCL|XFS_ILOCK_SHARED));
1da177e4
LT
1975 ASSERT(XFS_IS_QUOTA_RUNNING(mp));
1976
1977 delblks = ip->i_delayed_blks;
06d10dd9
NS
1978 blkflags = XFS_IS_REALTIME_INODE(ip) ?
1979 XFS_QMOPT_RES_RTBLKS : XFS_QMOPT_RES_REGBLKS;
1da177e4
LT
1980
1981 if (XFS_IS_UQUOTA_ON(mp) && udqp &&
1149d96a 1982 ip->i_d.di_uid != (uid_t)be32_to_cpu(udqp->q_core.d_id)) {
113a5683 1983 udq_delblks = udqp;
1da177e4
LT
1984 /*
1985 * If there are delayed allocation blocks, then we have to
1986 * unreserve those from the old dquot, and add them to the
1987 * new dquot.
1988 */
1989 if (delblks) {
1990 ASSERT(ip->i_udquot);
113a5683 1991 udq_unres = ip->i_udquot;
1da177e4
LT
1992 }
1993 }
92f8ff73
CS
1994 if (XFS_IS_GQUOTA_ON(ip->i_mount) && gdqp &&
1995 ip->i_d.di_gid != be32_to_cpu(gdqp->q_core.d_id)) {
1996 gdq_delblks = gdqp;
1997 if (delblks) {
1998 ASSERT(ip->i_gdquot);
1999 gdq_unres = ip->i_gdquot;
2000 }
2001 }
2002
2003 if (XFS_IS_PQUOTA_ON(ip->i_mount) && pdqp &&
2004 xfs_get_projid(ip) != be32_to_cpu(pdqp->q_core.d_id)) {
2005 prjflags = XFS_QMOPT_ENOSPC;
2006 pdq_delblks = pdqp;
2007 if (delblks) {
2008 ASSERT(ip->i_pdquot);
2009 pdq_unres = ip->i_pdquot;
1da177e4
LT
2010 }
2011 }
2012
113a5683 2013 error = xfs_trans_reserve_quota_bydquots(tp, ip->i_mount,
92f8ff73
CS
2014 udq_delblks, gdq_delblks, pdq_delblks,
2015 ip->i_d.di_nblocks, 1,
113a5683
CS
2016 flags | blkflags | prjflags);
2017 if (error)
2018 return error;
1da177e4
LT
2019
2020 /*
2021 * Do the delayed blks reservations/unreservations now. Since, these
2022 * are done without the help of a transaction, if a reservation fails
2023 * its previous reservations won't be automatically undone by trans
2024 * code. So, we have to do it manually here.
2025 */
2026 if (delblks) {
2027 /*
2028 * Do the reservations first. Unreservation can't fail.
2029 */
92f8ff73
CS
2030 ASSERT(udq_delblks || gdq_delblks || pdq_delblks);
2031 ASSERT(udq_unres || gdq_unres || pdq_unres);
113a5683 2032 error = xfs_trans_reserve_quota_bydquots(NULL, ip->i_mount,
92f8ff73
CS
2033 udq_delblks, gdq_delblks, pdq_delblks,
2034 (xfs_qcnt_t)delblks, 0,
113a5683
CS
2035 flags | blkflags | prjflags);
2036 if (error)
2037 return error;
1da177e4 2038 xfs_trans_reserve_quota_bydquots(NULL, ip->i_mount,
92f8ff73
CS
2039 udq_unres, gdq_unres, pdq_unres,
2040 -((xfs_qcnt_t)delblks), 0, blkflags);
1da177e4
LT
2041 }
2042
2043 return (0);
2044}
2045
2046int
2047xfs_qm_vop_rename_dqattach(
7d095257 2048 struct xfs_inode **i_tab)
1da177e4 2049{
7d095257
CH
2050 struct xfs_mount *mp = i_tab[0]->i_mount;
2051 int i;
1da177e4 2052
7d095257 2053 if (!XFS_IS_QUOTA_RUNNING(mp) || !XFS_IS_QUOTA_ON(mp))
014c2544 2054 return 0;
1da177e4 2055
7d095257
CH
2056 for (i = 0; (i < 4 && i_tab[i]); i++) {
2057 struct xfs_inode *ip = i_tab[i];
2058 int error;
2059
1da177e4
LT
2060 /*
2061 * Watch out for duplicate entries in the table.
2062 */
7d095257
CH
2063 if (i == 0 || ip != i_tab[i-1]) {
2064 if (XFS_NOT_DQATTACHED(mp, ip)) {
1da177e4
LT
2065 error = xfs_qm_dqattach(ip, 0);
2066 if (error)
014c2544 2067 return error;
1da177e4
LT
2068 }
2069 }
2070 }
014c2544 2071 return 0;
1da177e4
LT
2072}
2073
2074void
7d095257
CH
2075xfs_qm_vop_create_dqattach(
2076 struct xfs_trans *tp,
2077 struct xfs_inode *ip,
2078 struct xfs_dquot *udqp,
92f8ff73
CS
2079 struct xfs_dquot *gdqp,
2080 struct xfs_dquot *pdqp)
1da177e4 2081{
7d095257
CH
2082 struct xfs_mount *mp = tp->t_mountp;
2083
2084 if (!XFS_IS_QUOTA_RUNNING(mp) || !XFS_IS_QUOTA_ON(mp))
1da177e4
LT
2085 return;
2086
579aa9ca 2087 ASSERT(xfs_isilocked(ip, XFS_ILOCK_EXCL));
7d095257 2088 ASSERT(XFS_IS_QUOTA_RUNNING(mp));
1da177e4
LT
2089
2090 if (udqp) {
1da177e4 2091 ASSERT(ip->i_udquot == NULL);
7d095257 2092 ASSERT(XFS_IS_UQUOTA_ON(mp));
1149d96a 2093 ASSERT(ip->i_d.di_uid == be32_to_cpu(udqp->q_core.d_id));
78e55892
CH
2094
2095 ip->i_udquot = xfs_qm_dqhold(udqp);
1da177e4
LT
2096 xfs_trans_mod_dquot(tp, udqp, XFS_TRANS_DQ_ICOUNT, 1);
2097 }
2098 if (gdqp) {
1da177e4 2099 ASSERT(ip->i_gdquot == NULL);
92f8ff73
CS
2100 ASSERT(XFS_IS_GQUOTA_ON(mp));
2101 ASSERT(ip->i_d.di_gid == be32_to_cpu(gdqp->q_core.d_id));
78e55892 2102 ip->i_gdquot = xfs_qm_dqhold(gdqp);
1da177e4
LT
2103 xfs_trans_mod_dquot(tp, gdqp, XFS_TRANS_DQ_ICOUNT, 1);
2104 }
92f8ff73
CS
2105 if (pdqp) {
2106 ASSERT(ip->i_pdquot == NULL);
2107 ASSERT(XFS_IS_PQUOTA_ON(mp));
2108 ASSERT(xfs_get_projid(ip) == be32_to_cpu(pdqp->q_core.d_id));
2109
2110 ip->i_pdquot = xfs_qm_dqhold(pdqp);
2111 xfs_trans_mod_dquot(tp, pdqp, XFS_TRANS_DQ_ICOUNT, 1);
2112 }
1da177e4
LT
2113}
2114