fs/xfs/xfs_dquot.c

   1 /*
   2  * Copyright (c) 2000-2003 Silicon Graphics, Inc.
   3  * All Rights Reserved.
   4  *
   5  * This program is free software; you can redistribute it and/or
   6  * modify it under the terms of the GNU General Public License as
   7  * published by the Free Software Foundation.
   8  *
   9  * This program is distributed in the hope that it would be useful,
  10  * but WITHOUT ANY WARRANTY; without even the implied warranty of
  11  * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
  12  * GNU General Public License for more details.
  13  *
  14  * You should have received a copy of the GNU General Public License
  15  * along with this program; if not, write the Free Software Foundation,
  16  * Inc.,  51 Franklin St, Fifth Floor, Boston, MA  02110-1301  USA
  17  */
  18 #include "xfs.h"
  19 #include "xfs_fs.h"
  20 #include "xfs_format.h"
  21 #include "xfs_bit.h"
  22 #include "xfs_log.h"
  23 #include "xfs_trans.h"
  24 #include "xfs_sb.h"
  25 #include "xfs_ag.h"
  26 #include "xfs_alloc.h"
  27 #include "xfs_quota.h"
  28 #include "xfs_mount.h"
  29 #include "xfs_bmap_btree.h"
  30 #include "xfs_inode.h"
  31 #include "xfs_bmap.h"
  32 #include "xfs_rtalloc.h"
  33 #include "xfs_error.h"
  34 #include "xfs_itable.h"
  35 #include "xfs_attr.h"
  36 #include "xfs_buf_item.h"
  37 #include "xfs_trans_space.h"
  38 #include "xfs_trans_priv.h"
  39 #include "xfs_qm.h"
  40 #include "xfs_cksum.h"
  41 #include "xfs_trace.h"
  42
  43 /*
  44  * Lock order:
  45  *
  46  * ip->i_lock
  47  *   qi->qi_tree_lock
  48  *     dquot->q_qlock (xfs_dqlock() and friends)
  49  *       dquot->q_flush (xfs_dqflock() and friends)
  50  *       qi->qi_lru_lock
  51  *
  52  * If two dquots need to be locked the order is user before group/project,
  53  * otherwise by the lowest id first, see xfs_dqlock2.
  54  */
  55
  56 #ifdef DEBUG
  57 xfs_buftarg_t *xfs_dqerror_target;
  58 int xfs_do_dqerror;
  59 int xfs_dqreq_num;
  60 int xfs_dqerror_mod = 33;
  61 #endif
  62
  63 struct kmem_zone                *xfs_qm_dqtrxzone;
  64 static struct kmem_zone         *xfs_qm_dqzone;
  65
  66 static struct lock_class_key xfs_dquot_other_class;
  67
  68 /*
  69  * This is called to free all the memory associated with a dquot
  70  */
  71 void
  72 xfs_qm_dqdestroy(
  73         xfs_dquot_t     *dqp)
  74 {
  75         ASSERT(list_empty(&dqp->q_lru));
  76
  77         mutex_destroy(&dqp->q_qlock);
  78         kmem_zone_free(xfs_qm_dqzone, dqp);
  79
  80         XFS_STATS_DEC(xs_qm_dquot);
  81 }
  82
  83 /*
  84  * If default limits are in force, push them into the dquot now.
  85  * We overwrite the dquot limits only if they are zero and this
  86  * is not the root dquot.
  87  */
  88 void
  89 xfs_qm_adjust_dqlimits(
  90         struct xfs_mount        *mp,
  91         struct xfs_dquot        *dq)
  92 {
  93         struct xfs_quotainfo    *q = mp->m_quotainfo;
  94         struct xfs_disk_dquot   *d = &dq->q_core;
  95         int                     prealloc = 0;
  96
  97         ASSERT(d->d_id);
  98
  99         if (q->qi_bsoftlimit && !d->d_blk_softlimit) {
 100                 d->d_blk_softlimit = cpu_to_be64(q->qi_bsoftlimit);
 101                 prealloc = 1;
 102         }
 103         if (q->qi_bhardlimit && !d->d_blk_hardlimit) {
 104                 d->d_blk_hardlimit = cpu_to_be64(q->qi_bhardlimit);
 105                 prealloc = 1;
 106         }
 107         if (q->qi_isoftlimit && !d->d_ino_softlimit)
 108                 d->d_ino_softlimit = cpu_to_be64(q->qi_isoftlimit);
 109         if (q->qi_ihardlimit && !d->d_ino_hardlimit)
 110                 d->d_ino_hardlimit = cpu_to_be64(q->qi_ihardlimit);
 111         if (q->qi_rtbsoftlimit && !d->d_rtb_softlimit)
 112                 d->d_rtb_softlimit = cpu_to_be64(q->qi_rtbsoftlimit);
 113         if (q->qi_rtbhardlimit && !d->d_rtb_hardlimit)
 114                 d->d_rtb_hardlimit = cpu_to_be64(q->qi_rtbhardlimit);
 115
 116         if (prealloc)
 117                 xfs_dquot_set_prealloc_limits(dq);
 118 }
 119
 120 /*
 121  * Check the limits and timers of a dquot and start or reset timers
 122  * if necessary.
 123  * This gets called even when quota enforcement is OFF, which makes our
 124  * life a little less complicated. (We just don't reject any quota
 125  * reservations in that case, when enforcement is off).
 126  * We also return 0 as the values of the timers in Q_GETQUOTA calls, when
 127  * enforcement's off.
 128  * In contrast, warnings are a little different in that they don't
 129  * 'automatically' get started when limits get exceeded.  They do
 130  * get reset to zero, however, when we find the count to be under
 131  * the soft limit (they are only ever set non-zero via userspace).
 132  */
 133 void
 134 xfs_qm_adjust_dqtimers(
 135         xfs_mount_t             *mp,
 136         xfs_disk_dquot_t        *d)
 137 {
 138         ASSERT(d->d_id);
 139
 140 #ifdef DEBUG
 141         if (d->d_blk_hardlimit)
 142                 ASSERT(be64_to_cpu(d->d_blk_softlimit) <=
 143                        be64_to_cpu(d->d_blk_hardlimit));
 144         if (d->d_ino_hardlimit)
 145                 ASSERT(be64_to_cpu(d->d_ino_softlimit) <=
 146                        be64_to_cpu(d->d_ino_hardlimit));
 147         if (d->d_rtb_hardlimit)
 148                 ASSERT(be64_to_cpu(d->d_rtb_softlimit) <=
 149                        be64_to_cpu(d->d_rtb_hardlimit));
 150 #endif
 151
 152         if (!d->d_btimer) {
 153                 if ((d->d_blk_softlimit &&
 154                      (be64_to_cpu(d->d_bcount) >
 155                       be64_to_cpu(d->d_blk_softlimit))) ||
 156                     (d->d_blk_hardlimit &&
 157                      (be64_to_cpu(d->d_bcount) >
 158                       be64_to_cpu(d->d_blk_hardlimit)))) {
 159                         d->d_btimer = cpu_to_be32(get_seconds() +
 160                                         mp->m_quotainfo->qi_btimelimit);
 161                 } else {
 162                         d->d_bwarns = 0;
 163                 }
 164         } else {
 165                 if ((!d->d_blk_softlimit ||
 166                      (be64_to_cpu(d->d_bcount) <=
 167                       be64_to_cpu(d->d_blk_softlimit))) &&
 168                     (!d->d_blk_hardlimit ||
 169                     (be64_to_cpu(d->d_bcount) <=
 170                      be64_to_cpu(d->d_blk_hardlimit)))) {
 171                         d->d_btimer = 0;
 172                 }
 173         }
 174
 175         if (!d->d_itimer) {
 176                 if ((d->d_ino_softlimit &&
 177                      (be64_to_cpu(d->d_icount) >
 178                       be64_to_cpu(d->d_ino_softlimit))) ||
 179                     (d->d_ino_hardlimit &&
 180                      (be64_to_cpu(d->d_icount) >
 181                       be64_to_cpu(d->d_ino_hardlimit)))) {
 182                         d->d_itimer = cpu_to_be32(get_seconds() +
 183                                         mp->m_quotainfo->qi_itimelimit);
 184                 } else {
 185                         d->d_iwarns = 0;
 186                 }
 187         } else {
 188                 if ((!d->d_ino_softlimit ||
 189                      (be64_to_cpu(d->d_icount) <=
 190                       be64_to_cpu(d->d_ino_softlimit)))  &&
 191                     (!d->d_ino_hardlimit ||
 192                      (be64_to_cpu(d->d_icount) <=
 193                       be64_to_cpu(d->d_ino_hardlimit)))) {
 194                         d->d_itimer = 0;
 195                 }
 196         }
 197
 198         if (!d->d_rtbtimer) {
 199                 if ((d->d_rtb_softlimit &&
 200                      (be64_to_cpu(d->d_rtbcount) >
 201                       be64_to_cpu(d->d_rtb_softlimit))) ||
 202                     (d->d_rtb_hardlimit &&
 203                      (be64_to_cpu(d->d_rtbcount) >
 204                       be64_to_cpu(d->d_rtb_hardlimit)))) {
 205                         d->d_rtbtimer = cpu_to_be32(get_seconds() +
 206                                         mp->m_quotainfo->qi_rtbtimelimit);
 207                 } else {
 208                         d->d_rtbwarns = 0;
 209                 }
 210         } else {
 211                 if ((!d->d_rtb_softlimit ||
 212                      (be64_to_cpu(d->d_rtbcount) <=
 213                       be64_to_cpu(d->d_rtb_softlimit))) &&
 214                     (!d->d_rtb_hardlimit ||
 215                      (be64_to_cpu(d->d_rtbcount) <=
 216                       be64_to_cpu(d->d_rtb_hardlimit)))) {
 217                         d->d_rtbtimer = 0;
 218                 }
 219         }
 220 }
 221
 222 /*
 223  * initialize a buffer full of dquots and log the whole thing
 224  */
 225 STATIC void
 226 xfs_qm_init_dquot_blk(
 227         xfs_trans_t     *tp,
 228         xfs_mount_t     *mp,
 229         xfs_dqid_t      id,
 230         uint            type,
 231         xfs_buf_t       *bp)
 232 {
 233         struct xfs_quotainfo    *q = mp->m_quotainfo;
 234         xfs_dqblk_t     *d;
 235         int             curid, i;
 236
 237         ASSERT(tp);
 238         ASSERT(xfs_buf_islocked(bp));
 239
 240         d = bp->b_addr;
 241
 242         /*
 243          * ID of the first dquot in the block - id's are zero based.
 244          */
 245         curid = id - (id % q->qi_dqperchunk);
 246         ASSERT(curid >= 0);
 247         memset(d, 0, BBTOB(q->qi_dqchunklen));
 248         for (i = 0; i < q->qi_dqperchunk; i++, d++, curid++) {
 249                 d->dd_diskdq.d_magic = cpu_to_be16(XFS_DQUOT_MAGIC);
 250                 d->dd_diskdq.d_version = XFS_DQUOT_VERSION;
 251                 d->dd_diskdq.d_id = cpu_to_be32(curid);
 252                 d->dd_diskdq.d_flags = type;
 253                 if (xfs_sb_version_hascrc(&mp->m_sb)) {
 254                         uuid_copy(&d->dd_uuid, &mp->m_sb.sb_uuid);
 255                         xfs_update_cksum((char *)d, sizeof(struct xfs_dqblk),
 256                                          XFS_DQUOT_CRC_OFF);
 257                 }
 258         }
 259
 260         xfs_trans_dquot_buf(tp, bp,
 261                             (type & XFS_DQ_USER ? XFS_BLF_UDQUOT_BUF :
 262                             ((type & XFS_DQ_PROJ) ? XFS_BLF_PDQUOT_BUF :
 263                              XFS_BLF_GDQUOT_BUF)));
 264         xfs_trans_log_buf(tp, bp, 0, BBTOB(q->qi_dqchunklen) - 1);
 265 }
 266
 267 /*
 268  * Initialize the dynamic speculative preallocation thresholds. The lo/hi
 269  * watermarks correspond to the soft and hard limits by default. If a soft limit
 270  * is not specified, we use 95% of the hard limit.
 271  */
 272 void
 273 xfs_dquot_set_prealloc_limits(struct xfs_dquot *dqp)
 274 {
 275         __uint64_t space;
 276
 277         dqp->q_prealloc_hi_wmark = be64_to_cpu(dqp->q_core.d_blk_hardlimit);
 278         dqp->q_prealloc_lo_wmark = be64_to_cpu(dqp->q_core.d_blk_softlimit);
 279         if (!dqp->q_prealloc_lo_wmark) {
 280                 dqp->q_prealloc_lo_wmark = dqp->q_prealloc_hi_wmark;
 281                 do_div(dqp->q_prealloc_lo_wmark, 100);
 282                 dqp->q_prealloc_lo_wmark *= 95;
 283         }
 284
 285         space = dqp->q_prealloc_hi_wmark;
 286
 287         do_div(space, 100);
 288         dqp->q_low_space[XFS_QLOWSP_1_PCNT] = space;
 289         dqp->q_low_space[XFS_QLOWSP_3_PCNT] = space * 3;
 290         dqp->q_low_space[XFS_QLOWSP_5_PCNT] = space * 5;
 291 }
 292
 293 STATIC bool
 294 xfs_dquot_buf_verify_crc(
 295         struct xfs_mount        *mp,
 296         struct xfs_buf          *bp)
 297 {
 298         struct xfs_dqblk        *d = (struct xfs_dqblk *)bp->b_addr;
 299         int                     ndquots;
 300         int                     i;
 301
 302         if (!xfs_sb_version_hascrc(&mp->m_sb))
 303                 return true;
 304
 305         /*
 306          * if we are in log recovery, the quota subsystem has not been
 307          * initialised so we have no quotainfo structure. In that case, we need
 308          * to manually calculate the number of dquots in the buffer.
 309          */
 310         if (mp->m_quotainfo)
 311                 ndquots = mp->m_quotainfo->qi_dqperchunk;
 312         else
 313                 ndquots = xfs_qm_calc_dquots_per_chunk(mp,
 314                                         XFS_BB_TO_FSB(mp, bp->b_length));
 315
 316         for (i = 0; i < ndquots; i++, d++) {
 317                 if (!xfs_verify_cksum((char *)d, sizeof(struct xfs_dqblk),
 318                                  XFS_DQUOT_CRC_OFF))
 319                         return false;
 320                 if (!uuid_equal(&d->dd_uuid, &mp->m_sb.sb_uuid))
 321                         return false;
 322         }
 323         return true;
 324 }
 325
 326 STATIC bool
 327 xfs_dquot_buf_verify(
 328         struct xfs_mount        *mp,
 329         struct xfs_buf          *bp)
 330 {
 331         struct xfs_dqblk        *d = (struct xfs_dqblk *)bp->b_addr;
 332         xfs_dqid_t              id = 0;
 333         int                     ndquots;
 334         int                     i;
 335
 336         /*
 337          * if we are in log recovery, the quota subsystem has not been
 338          * initialised so we have no quotainfo structure. In that case, we need
 339          * to manually calculate the number of dquots in the buffer.
 340          */
 341         if (mp->m_quotainfo)
 342                 ndquots = mp->m_quotainfo->qi_dqperchunk;
 343         else
 344                 ndquots = xfs_qm_calc_dquots_per_chunk(mp, bp->b_length);
 345
 346         /*
 347          * On the first read of the buffer, verify that each dquot is valid.
 348          * We don't know what the id of the dquot is supposed to be, just that
 349          * they should be increasing monotonically within the buffer. If the
 350          * first id is corrupt, then it will fail on the second dquot in the
 351          * buffer so corruptions could point to the wrong dquot in this case.
 352          */
 353         for (i = 0; i < ndquots; i++) {
 354                 struct xfs_disk_dquot   *ddq;
 355                 int                     error;
 356
 357                 ddq = &d[i].dd_diskdq;
 358
 359                 if (i == 0)
 360                         id = be32_to_cpu(ddq->d_id);
 361
 362                 error = xfs_qm_dqcheck(mp, ddq, id + i, 0, XFS_QMOPT_DOWARN,
 363                                        "xfs_dquot_buf_verify");
 364                 if (error)
 365                         return false;
 366         }
 367         return true;
 368 }
 369
 370 static void
 371 xfs_dquot_buf_read_verify(
 372         struct xfs_buf  *bp)
 373 {
 374         struct xfs_mount        *mp = bp->b_target->bt_mount;
 375
 376         if (!xfs_dquot_buf_verify_crc(mp, bp) || !xfs_dquot_buf_verify(mp, bp)) {
 377                 XFS_CORRUPTION_ERROR(__func__, XFS_ERRLEVEL_LOW, mp, bp->b_addr);
 378                 xfs_buf_ioerror(bp, EFSCORRUPTED);
 379         }
 380 }
 381
 382 /*
 383  * we don't calculate the CRC here as that is done when the dquot is flushed to
 384  * the buffer after the update is done. This ensures that the dquot in the
 385  * buffer always has an up-to-date CRC value.
 386  */
 387 void
 388 xfs_dquot_buf_write_verify(
 389         struct xfs_buf  *bp)
 390 {
 391         struct xfs_mount        *mp = bp->b_target->bt_mount;
 392
 393         if (!xfs_dquot_buf_verify(mp, bp)) {
 394                 XFS_CORRUPTION_ERROR(__func__, XFS_ERRLEVEL_LOW, mp, bp->b_addr);
 395                 xfs_buf_ioerror(bp, EFSCORRUPTED);
 396                 return;
 397         }
 398 }
 399
 400 const struct xfs_buf_ops xfs_dquot_buf_ops = {
 401         .verify_read = xfs_dquot_buf_read_verify,
 402         .verify_write = xfs_dquot_buf_write_verify,
 403 };
 404
 405 /*
 406  * Allocate a block and fill it with dquots.
 407  * This is called when the bmapi finds a hole.
 408  */
 409 STATIC int
 410 xfs_qm_dqalloc(
 411         xfs_trans_t     **tpp,
 412         xfs_mount_t     *mp,
 413         xfs_dquot_t     *dqp,
 414         xfs_inode_t     *quotip,
 415         xfs_fileoff_t   offset_fsb,
 416         xfs_buf_t       **O_bpp)
 417 {
 418         xfs_fsblock_t   firstblock;
 419         xfs_bmap_free_t flist;
 420         xfs_bmbt_irec_t map;
 421         int             nmaps, error, committed;
 422         xfs_buf_t       *bp;
 423         xfs_trans_t     *tp = *tpp;
 424
 425         ASSERT(tp != NULL);
 426
 427         trace_xfs_dqalloc(dqp);
 428
 429         /*
 430          * Initialize the bmap freelist prior to calling bmapi code.
 431          */
 432         xfs_bmap_init(&flist, &firstblock);
 433         xfs_ilock(quotip, XFS_ILOCK_EXCL);
 434         /*
 435          * Return if this type of quotas is turned off while we didn't
 436          * have an inode lock
 437          */
 438         if (!xfs_this_quota_on(dqp->q_mount, dqp->dq_flags)) {
 439                 xfs_iunlock(quotip, XFS_ILOCK_EXCL);
 440                 return (ESRCH);
 441         }
 442
 443         xfs_trans_ijoin(tp, quotip, XFS_ILOCK_EXCL);
 444         nmaps = 1;
 445         error = xfs_bmapi_write(tp, quotip, offset_fsb,
 446                                 XFS_DQUOT_CLUSTER_SIZE_FSB, XFS_BMAPI_METADATA,
 447                                 &firstblock, XFS_QM_DQALLOC_SPACE_RES(mp),
 448                                 &map, &nmaps, &flist);
 449         if (error)
 450                 goto error0;
 451         ASSERT(map.br_blockcount == XFS_DQUOT_CLUSTER_SIZE_FSB);
 452         ASSERT(nmaps == 1);
 453         ASSERT((map.br_startblock != DELAYSTARTBLOCK) &&
 454                (map.br_startblock != HOLESTARTBLOCK));
 455
 456         /*
 457          * Keep track of the blkno to save a lookup later
 458          */
 459         dqp->q_blkno = XFS_FSB_TO_DADDR(mp, map.br_startblock);
 460
 461         /* now we can just get the buffer (there's nothing to read yet) */
 462         bp = xfs_trans_get_buf(tp, mp->m_ddev_targp,
 463                                dqp->q_blkno,
 464                                mp->m_quotainfo->qi_dqchunklen,
 465                                0);
 466
 467         error = xfs_buf_geterror(bp);
 468         if (error)
 469                 goto error1;
 470         bp->b_ops = &xfs_dquot_buf_ops;
 471
 472         /*
 473          * Make a chunk of dquots out of this buffer and log
 474          * the entire thing.
 475          */
 476         xfs_qm_init_dquot_blk(tp, mp, be32_to_cpu(dqp->q_core.d_id),
 477                               dqp->dq_flags & XFS_DQ_ALLTYPES, bp);
 478
 479         /*
 480          * xfs_bmap_finish() may commit the current transaction and
 481          * start a second transaction if the freelist is not empty.
 482          *
 483          * Since we still want to modify this buffer, we need to
 484          * ensure that the buffer is not released on commit of
 485          * the first transaction and ensure the buffer is added to the
 486          * second transaction.
 487          *
 488          * If there is only one transaction then don't stop the buffer
 489          * from being released when it commits later on.
 490          */
 491
 492         xfs_trans_bhold(tp, bp);
 493
 494         if ((error = xfs_bmap_finish(tpp, &flist, &committed))) {
 495                 goto error1;
 496         }
 497
 498         if (committed) {
 499                 tp = *tpp;
 500                 xfs_trans_bjoin(tp, bp);
 501         } else {
 502                 xfs_trans_bhold_release(tp, bp);
 503         }
 504
 505         *O_bpp = bp;
 506         return 0;
 507
 508       error1:
 509         xfs_bmap_cancel(&flist);
 510       error0:
 511         xfs_iunlock(quotip, XFS_ILOCK_EXCL);
 512
 513         return (error);
 514 }
 515 STATIC int
 516 xfs_qm_dqrepair(
 517         struct xfs_mount        *mp,
 518         struct xfs_trans        *tp,
 519         struct xfs_dquot        *dqp,
 520         xfs_dqid_t              firstid,
 521         struct xfs_buf          **bpp)
 522 {
 523         int                     error;
 524         struct xfs_disk_dquot   *ddq;
 525         struct xfs_dqblk        *d;
 526         int                     i;
 527
 528         /*
 529          * Read the buffer without verification so we get the corrupted
 530          * buffer returned to us. make sure we verify it on write, though.
 531          */
 532         error = xfs_trans_read_buf(mp, tp, mp->m_ddev_targp, dqp->q_blkno,
 533                                    mp->m_quotainfo->qi_dqchunklen,
 534                                    0, bpp, NULL);
 535
 536         if (error) {
 537                 ASSERT(*bpp == NULL);
 538                 return XFS_ERROR(error);
 539         }
 540         (*bpp)->b_ops = &xfs_dquot_buf_ops;
 541
 542         ASSERT(xfs_buf_islocked(*bpp));
 543         d = (struct xfs_dqblk *)(*bpp)->b_addr;
 544
 545         /* Do the actual repair of dquots in this buffer */
 546         for (i = 0; i < mp->m_quotainfo->qi_dqperchunk; i++) {
 547                 ddq = &d[i].dd_diskdq;
 548                 error = xfs_qm_dqcheck(mp, ddq, firstid + i,
 549                                        dqp->dq_flags & XFS_DQ_ALLTYPES,
 550                                        XFS_QMOPT_DQREPAIR, "xfs_qm_dqrepair");
 551                 if (error) {
 552                         /* repair failed, we're screwed */
 553                         xfs_trans_brelse(tp, *bpp);
 554                         return XFS_ERROR(EIO);
 555                 }
 556         }
 557
 558         return 0;
 559 }
 560
 561 /*
 562  * Maps a dquot to the buffer containing its on-disk version.
 563  * This returns a ptr to the buffer containing the on-disk dquot
 564  * in the bpp param, and a ptr to the on-disk dquot within that buffer
 565  */
 566 STATIC int
 567 xfs_qm_dqtobp(
 568         xfs_trans_t             **tpp,
 569         xfs_dquot_t             *dqp,
 570         xfs_disk_dquot_t        **O_ddpp,
 571         xfs_buf_t               **O_bpp,
 572         uint                    flags)
 573 {
 574         struct xfs_bmbt_irec    map;
 575         int                     nmaps = 1, error;
 576         struct xfs_buf          *bp;
 577         struct xfs_inode        *quotip = xfs_dq_to_quota_inode(dqp);
 578         struct xfs_mount        *mp = dqp->q_mount;
 579         xfs_dqid_t              id = be32_to_cpu(dqp->q_core.d_id);
 580         struct xfs_trans        *tp = (tpp ? *tpp : NULL);
 581
 582         dqp->q_fileoffset = (xfs_fileoff_t)id / mp->m_quotainfo->qi_dqperchunk;
 583
 584         xfs_ilock(quotip, XFS_ILOCK_SHARED);
 585         if (!xfs_this_quota_on(dqp->q_mount, dqp->dq_flags)) {
 586                 /*
 587                  * Return if this type of quotas is turned off while we
 588                  * didn't have the quota inode lock.
 589                  */
 590                 xfs_iunlock(quotip, XFS_ILOCK_SHARED);
 591                 return ESRCH;
 592         }
 593
 594         /*
 595          * Find the block map; no allocations yet
 596          */
 597         error = xfs_bmapi_read(quotip, dqp->q_fileoffset,
 598                                XFS_DQUOT_CLUSTER_SIZE_FSB, &map, &nmaps, 0);
 599
 600         xfs_iunlock(quotip, XFS_ILOCK_SHARED);
 601         if (error)
 602                 return error;
 603
 604         ASSERT(nmaps == 1);
 605         ASSERT(map.br_blockcount == 1);
 606
 607         /*
 608          * Offset of dquot in the (fixed sized) dquot chunk.
 609          */
 610         dqp->q_bufoffset = (id % mp->m_quotainfo->qi_dqperchunk) *
 611                 sizeof(xfs_dqblk_t);
 612
 613         ASSERT(map.br_startblock != DELAYSTARTBLOCK);
 614         if (map.br_startblock == HOLESTARTBLOCK) {
 615                 /*
 616                  * We don't allocate unless we're asked to
 617                  */
 618                 if (!(flags & XFS_QMOPT_DQALLOC))
 619                         return ENOENT;
 620
 621                 ASSERT(tp);
 622                 error = xfs_qm_dqalloc(tpp, mp, dqp, quotip,
 623                                         dqp->q_fileoffset, &bp);
 624                 if (error)
 625                         return error;
 626                 tp = *tpp;
 627         } else {
 628                 trace_xfs_dqtobp_read(dqp);
 629
 630                 /*
 631                  * store the blkno etc so that we don't have to do the
 632                  * mapping all the time
 633                  */
 634                 dqp->q_blkno = XFS_FSB_TO_DADDR(mp, map.br_startblock);
 635
 636                 error = xfs_trans_read_buf(mp, tp, mp->m_ddev_targp,
 637                                            dqp->q_blkno,
 638                                            mp->m_quotainfo->qi_dqchunklen,
 639                                            0, &bp, &xfs_dquot_buf_ops);
 640
 641                 if (error == EFSCORRUPTED && (flags & XFS_QMOPT_DQREPAIR)) {
 642                         xfs_dqid_t firstid = (xfs_dqid_t)map.br_startoff *
 643                                                 mp->m_quotainfo->qi_dqperchunk;
 644                         ASSERT(bp == NULL);
 645                         error = xfs_qm_dqrepair(mp, tp, dqp, firstid, &bp);
 646                 }
 647
 648                 if (error) {
 649                         ASSERT(bp == NULL);
 650                         return XFS_ERROR(error);
 651                 }
 652         }
 653
 654         ASSERT(xfs_buf_islocked(bp));
 655         *O_bpp = bp;
 656         *O_ddpp = bp->b_addr + dqp->q_bufoffset;
 657
 658         return (0);
 659 }
 660
 661
 662 /*
 663  * Read in the ondisk dquot using dqtobp() then copy it to an incore version,
 664  * and release the buffer immediately.
 665  *
 666  * If XFS_QMOPT_DQALLOC is set, allocate a dquot on disk if it needed.
 667  */
 668 int
 669 xfs_qm_dqread(
 670         struct xfs_mount        *mp,
 671         xfs_dqid_t              id,
 672         uint                    type,
 673         uint                    flags,
 674         struct xfs_dquot        **O_dqpp)
 675 {
 676         struct xfs_dquot        *dqp;
 677         struct xfs_disk_dquot   *ddqp;
 678         struct xfs_buf          *bp;
 679         struct xfs_trans        *tp = NULL;
 680         int                     error;
 681         int                     cancelflags = 0;
 682
 683
 684         dqp = kmem_zone_zalloc(xfs_qm_dqzone, KM_SLEEP);
 685
 686         dqp->dq_flags = type;
 687         dqp->q_core.d_id = cpu_to_be32(id);
 688         dqp->q_mount = mp;
 689         INIT_LIST_HEAD(&dqp->q_lru);
 690         mutex_init(&dqp->q_qlock);
 691         init_waitqueue_head(&dqp->q_pinwait);
 692
 693         /*
 694          * Because we want to use a counting completion, complete
 695          * the flush completion once to allow a single access to
 696          * the flush completion without blocking.
 697          */
 698         init_completion(&dqp->q_flush);
 699         complete(&dqp->q_flush);
 700
 701         /*
 702          * Make sure group quotas have a different lock class than user
 703          * quotas.
 704          */
 705         if (!(type & XFS_DQ_USER))
 706                 lockdep_set_class(&dqp->q_qlock, &xfs_dquot_other_class);
 707
 708         XFS_STATS_INC(xs_qm_dquot);
 709
 710         trace_xfs_dqread(dqp);
 711
 712         if (flags & XFS_QMOPT_DQALLOC) {
 713                 tp = xfs_trans_alloc(mp, XFS_TRANS_QM_DQALLOC);
 714                 error = xfs_trans_reserve(tp, XFS_QM_DQALLOC_SPACE_RES(mp),
 715                                           XFS_QM_DQALLOC_LOG_RES(mp), 0,
 716                                           XFS_TRANS_PERM_LOG_RES,
 717                                           XFS_WRITE_LOG_COUNT);
 718                 if (error)
 719                         goto error1;
 720                 cancelflags = XFS_TRANS_RELEASE_LOG_RES;
 721         }
 722
 723         /*
 724          * get a pointer to the on-disk dquot and the buffer containing it
 725          * dqp already knows its own type (GROUP/USER).
 726          */
 727         error = xfs_qm_dqtobp(&tp, dqp, &ddqp, &bp, flags);
 728         if (error) {
 729                 /*
 730                  * This can happen if quotas got turned off (ESRCH),
 731                  * or if the dquot didn't exist on disk and we ask to
 732                  * allocate (ENOENT).
 733                  */
 734                 trace_xfs_dqread_fail(dqp);
 735                 cancelflags |= XFS_TRANS_ABORT;
 736                 goto error1;
 737         }
 738
 739         /* copy everything from disk dquot to the incore dquot */
 740         memcpy(&dqp->q_core, ddqp, sizeof(xfs_disk_dquot_t));
 741         xfs_qm_dquot_logitem_init(dqp);
 742
 743         /*
 744          * Reservation counters are defined as reservation plus current usage
 745          * to avoid having to add every time.
 746          */
 747         dqp->q_res_bcount = be64_to_cpu(ddqp->d_bcount);
 748         dqp->q_res_icount = be64_to_cpu(ddqp->d_icount);
 749         dqp->q_res_rtbcount = be64_to_cpu(ddqp->d_rtbcount);
 750
 751         /* initialize the dquot speculative prealloc thresholds */
 752         xfs_dquot_set_prealloc_limits(dqp);
 753
 754         /* Mark the buf so that this will stay incore a little longer */
 755         xfs_buf_set_ref(bp, XFS_DQUOT_REF);
 756
 757         /*
 758          * We got the buffer with a xfs_trans_read_buf() (in dqtobp())
 759          * So we need to release with xfs_trans_brelse().
 760          * The strategy here is identical to that of inodes; we lock
 761          * the dquot in xfs_qm_dqget() before making it accessible to
 762          * others. This is because dquots, like inodes, need a good level of
 763          * concurrency, and we don't want to take locks on the entire buffers
 764          * for dquot accesses.
 765          * Note also that the dquot buffer may even be dirty at this point, if
 766          * this particular dquot was repaired. We still aren't afraid to
 767          * brelse it because we have the changes incore.
 768          */
 769         ASSERT(xfs_buf_islocked(bp));
 770         xfs_trans_brelse(tp, bp);
 771
 772         if (tp) {
 773                 error = xfs_trans_commit(tp, XFS_TRANS_RELEASE_LOG_RES);
 774                 if (error)
 775                         goto error0;
 776         }
 777
 778         *O_dqpp = dqp;
 779         return error;
 780
 781 error1:
 782         if (tp)
 783                 xfs_trans_cancel(tp, cancelflags);
 784 error0:
 785         xfs_qm_dqdestroy(dqp);
 786         *O_dqpp = NULL;
 787         return error;
 788 }
 789
 790 /*
 791  * Given the file system, inode OR id, and type (UDQUOT/GDQUOT), return a
 792  * a locked dquot, doing an allocation (if requested) as needed.
 793  * When both an inode and an id are given, the inode's id takes precedence.
 794  * That is, if the id changes while we don't hold the ilock inside this
 795  * function, the new dquot is returned, not necessarily the one requested
 796  * in the id argument.
 797  */
 798 int
 799 xfs_qm_dqget(
 800         xfs_mount_t     *mp,
 801         xfs_inode_t     *ip,      /* locked inode (optional) */
 802         xfs_dqid_t      id,       /* uid/projid/gid depending on type */
 803         uint            type,     /* XFS_DQ_USER/XFS_DQ_PROJ/XFS_DQ_GROUP */
 804         uint            flags,    /* DQALLOC, DQSUSER, DQREPAIR, DOWARN */
 805         xfs_dquot_t     **O_dqpp) /* OUT : locked incore dquot */
 806 {
 807         struct xfs_quotainfo    *qi = mp->m_quotainfo;
 808         struct radix_tree_root *tree = xfs_dquot_tree(qi, type);
 809         struct xfs_dquot        *dqp;
 810         int                     error;
 811
 812         ASSERT(XFS_IS_QUOTA_RUNNING(mp));
 813         if ((! XFS_IS_UQUOTA_ON(mp) && type == XFS_DQ_USER) ||
 814             (! XFS_IS_PQUOTA_ON(mp) && type == XFS_DQ_PROJ) ||
 815             (! XFS_IS_GQUOTA_ON(mp) && type == XFS_DQ_GROUP)) {
 816                 return (ESRCH);
 817         }
 818
 819 #ifdef DEBUG
 820         if (xfs_do_dqerror) {
 821                 if ((xfs_dqerror_target == mp->m_ddev_targp) &&
 822                     (xfs_dqreq_num++ % xfs_dqerror_mod) == 0) {
 823                         xfs_debug(mp, "Returning error in dqget");
 824                         return (EIO);
 825                 }
 826         }
 827
 828         ASSERT(type == XFS_DQ_USER ||
 829                type == XFS_DQ_PROJ ||
 830                type == XFS_DQ_GROUP);
 831         if (ip) {
 832                 ASSERT(xfs_isilocked(ip, XFS_ILOCK_EXCL));
 833                 ASSERT(xfs_inode_dquot(ip, type) == NULL);
 834         }
 835 #endif
 836
 837 restart:
 838         mutex_lock(&qi->qi_tree_lock);
 839         dqp = radix_tree_lookup(tree, id);
 840         if (dqp) {
 841                 xfs_dqlock(dqp);
 842                 if (dqp->dq_flags & XFS_DQ_FREEING) {
 843                         xfs_dqunlock(dqp);
 844                         mutex_unlock(&qi->qi_tree_lock);
 845                         trace_xfs_dqget_freeing(dqp);
 846                         delay(1);
 847                         goto restart;
 848                 }
 849
 850                 dqp->q_nrefs++;
 851                 mutex_unlock(&qi->qi_tree_lock);
 852
 853                 trace_xfs_dqget_hit(dqp);
 854                 XFS_STATS_INC(xs_qm_dqcachehits);
 855                 *O_dqpp = dqp;
 856                 return 0;
 857         }
 858         mutex_unlock(&qi->qi_tree_lock);
 859         XFS_STATS_INC(xs_qm_dqcachemisses);
 860
 861         /*
 862          * Dquot cache miss. We don't want to keep the inode lock across
 863          * a (potential) disk read. Also we don't want to deal with the lock
 864          * ordering between quotainode and this inode. OTOH, dropping the inode
 865          * lock here means dealing with a chown that can happen before
 866          * we re-acquire the lock.
 867          */
 868         if (ip)
 869                 xfs_iunlock(ip, XFS_ILOCK_EXCL);
 870
 871         error = xfs_qm_dqread(mp, id, type, flags, &dqp);
 872
 873         if (ip)
 874                 xfs_ilock(ip, XFS_ILOCK_EXCL);
 875
 876         if (error)
 877                 return error;
 878
 879         if (ip) {
 880                 /*
 881                  * A dquot could be attached to this inode by now, since
 882                  * we had dropped the ilock.
 883                  */
 884                 if (xfs_this_quota_on(mp, type)) {
 885                         struct xfs_dquot        *dqp1;
 886
 887                         dqp1 = xfs_inode_dquot(ip, type);
 888                         if (dqp1) {
 889                                 xfs_qm_dqdestroy(dqp);
 890                                 dqp = dqp1;
 891                                 xfs_dqlock(dqp);
 892                                 goto dqret;
 893                         }
 894                 } else {
 895                         /* inode stays locked on return */
 896                         xfs_qm_dqdestroy(dqp);
 897                         return XFS_ERROR(ESRCH);
 898                 }
 899         }
 900
 901         mutex_lock(&qi->qi_tree_lock);
 902         error = -radix_tree_insert(tree, id, dqp);
 903         if (unlikely(error)) {
 904                 WARN_ON(error != EEXIST);
 905
 906                 /*
 907                  * Duplicate found. Just throw away the new dquot and start
 908                  * over.
 909                  */
 910                 mutex_unlock(&qi->qi_tree_lock);
 911                 trace_xfs_dqget_dup(dqp);
 912                 xfs_qm_dqdestroy(dqp);
 913                 XFS_STATS_INC(xs_qm_dquot_dups);
 914                 goto restart;
 915         }
 916
 917         /*
 918          * We return a locked dquot to the caller, with a reference taken
 919          */
 920         xfs_dqlock(dqp);
 921         dqp->q_nrefs = 1;
 922
 923         qi->qi_dquots++;
 924         mutex_unlock(&qi->qi_tree_lock);
 925
 926  dqret:
 927         ASSERT((ip == NULL) || xfs_isilocked(ip, XFS_ILOCK_EXCL));
 928         trace_xfs_dqget_miss(dqp);
 929         *O_dqpp = dqp;
 930         return (0);
 931 }
 932
 933
 934 STATIC void
 935 xfs_qm_dqput_final(
 936         struct xfs_dquot        *dqp)
 937 {
 938         struct xfs_quotainfo    *qi = dqp->q_mount->m_quotainfo;
 939         struct xfs_dquot        *gdqp;
 940         struct xfs_dquot        *pdqp;
 941
 942         trace_xfs_dqput_free(dqp);
 943
 944         mutex_lock(&qi->qi_lru_lock);
 945         if (list_empty(&dqp->q_lru)) {
 946                 list_add_tail(&dqp->q_lru, &qi->qi_lru_list);
 947                 qi->qi_lru_count++;
 948                 XFS_STATS_INC(xs_qm_dquot_unused);
 949         }
 950         mutex_unlock(&qi->qi_lru_lock);
 951
 952         /*
 953          * If we just added a udquot to the freelist, then we want to release
 954          * the gdquot/pdquot reference that it (probably) has. Otherwise it'll
 955          * keep the gdquot/pdquot from getting reclaimed.
 956          */
 957         gdqp = dqp->q_gdquot;
 958         if (gdqp) {
 959                 xfs_dqlock(gdqp);
 960                 dqp->q_gdquot = NULL;
 961         }
 962
 963         pdqp = dqp->q_pdquot;
 964         if (pdqp) {
 965                 xfs_dqlock(pdqp);
 966                 dqp->q_pdquot = NULL;
 967         }
 968         xfs_dqunlock(dqp);
 969
 970         /*
 971          * If we had a group/project quota hint, release it now.
 972          */
 973         if (gdqp)
 974                 xfs_qm_dqput(gdqp);
 975         if (pdqp)
 976                 xfs_qm_dqput(pdqp);
 977 }
 978
 979 /*
 980  * Release a reference to the dquot (decrement ref-count) and unlock it.
 981  *
 982  * If there is a group quota attached to this dquot, carefully release that
 983  * too without tripping over deadlocks'n'stuff.
 984  */
 985 void
 986 xfs_qm_dqput(
 987         struct xfs_dquot        *dqp)
 988 {
 989         ASSERT(dqp->q_nrefs > 0);
 990         ASSERT(XFS_DQ_IS_LOCKED(dqp));
 991
 992         trace_xfs_dqput(dqp);
 993
 994         if (--dqp->q_nrefs > 0)
 995                 xfs_dqunlock(dqp);
 996         else
 997                 xfs_qm_dqput_final(dqp);
 998 }
 999
1000 /*
1001  * Release a dquot. Flush it if dirty, then dqput() it.
1002  * dquot must not be locked.
1003  */
1004 void
1005 xfs_qm_dqrele(
1006         xfs_dquot_t     *dqp)
1007 {
1008         if (!dqp)
1009                 return;
1010
1011         trace_xfs_dqrele(dqp);
1012
1013         xfs_dqlock(dqp);
1014         /*
1015          * We don't care to flush it if the dquot is dirty here.
1016          * That will create stutters that we want to avoid.
1017          * Instead we do a delayed write when we try to reclaim
1018          * a dirty dquot. Also xfs_sync will take part of the burden...
1019          */
1020         xfs_qm_dqput(dqp);
1021 }
1022
1023 /*
1024  * This is the dquot flushing I/O completion routine.  It is called
1025  * from interrupt level when the buffer containing the dquot is
1026  * flushed to disk.  It is responsible for removing the dquot logitem
1027  * from the AIL if it has not been re-logged, and unlocking the dquot's
1028  * flush lock. This behavior is very similar to that of inodes..
1029  */
1030 STATIC void
1031 xfs_qm_dqflush_done(
1032         struct xfs_buf          *bp,
1033         struct xfs_log_item     *lip)
1034 {
1035         xfs_dq_logitem_t        *qip = (struct xfs_dq_logitem *)lip;
1036         xfs_dquot_t             *dqp = qip->qli_dquot;
1037         struct xfs_ail          *ailp = lip->li_ailp;
1038
1039         /*
1040          * We only want to pull the item from the AIL if its
1041          * location in the log has not changed since we started the flush.
1042          * Thus, we only bother if the dquot's lsn has
1043          * not changed. First we check the lsn outside the lock
1044          * since it's cheaper, and then we recheck while
1045          * holding the lock before removing the dquot from the AIL.
1046          */
1047         if ((lip->li_flags & XFS_LI_IN_AIL) &&
1048             lip->li_lsn == qip->qli_flush_lsn) {
1049
1050                 /* xfs_trans_ail_delete() drops the AIL lock. */
1051                 spin_lock(&ailp->xa_lock);
1052                 if (lip->li_lsn == qip->qli_flush_lsn)
1053                         xfs_trans_ail_delete(ailp, lip, SHUTDOWN_CORRUPT_INCORE);
1054                 else
1055                         spin_unlock(&ailp->xa_lock);
1056         }
1057
1058         /*
1059          * Release the dq's flush lock since we're done with it.
1060          */
1061         xfs_dqfunlock(dqp);
1062 }
1063
1064 /*
1065  * Write a modified dquot to disk.
1066  * The dquot must be locked and the flush lock too taken by caller.
1067  * The flush lock will not be unlocked until the dquot reaches the disk,
1068  * but the dquot is free to be unlocked and modified by the caller
1069  * in the interim. Dquot is still locked on return. This behavior is
1070  * identical to that of inodes.
1071  */
1072 int
1073 xfs_qm_dqflush(
1074         struct xfs_dquot        *dqp,
1075         struct xfs_buf          **bpp)
1076 {
1077         struct xfs_mount        *mp = dqp->q_mount;
1078         struct xfs_buf          *bp;
1079         struct xfs_disk_dquot   *ddqp;
1080         int                     error;
1081
1082         ASSERT(XFS_DQ_IS_LOCKED(dqp));
1083         ASSERT(!completion_done(&dqp->q_flush));
1084
1085         trace_xfs_dqflush(dqp);
1086
1087         *bpp = NULL;
1088
1089         xfs_qm_dqunpin_wait(dqp);
1090
1091         /*
1092          * This may have been unpinned because the filesystem is shutting
1093          * down forcibly. If that's the case we must not write this dquot
1094          * to disk, because the log record didn't make it to disk.
1095          *
1096          * We also have to remove the log item from the AIL in this case,
1097          * as we wait for an emptry AIL as part of the unmount process.
1098          */
1099         if (XFS_FORCED_SHUTDOWN(mp)) {
1100                 struct xfs_log_item     *lip = &dqp->q_logitem.qli_item;
1101                 dqp->dq_flags &= ~XFS_DQ_DIRTY;
1102
1103                 spin_lock(&mp->m_ail->xa_lock);
1104                 if (lip->li_flags & XFS_LI_IN_AIL)
1105                         xfs_trans_ail_delete(mp->m_ail, lip,
1106                                              SHUTDOWN_CORRUPT_INCORE);
1107                 else
1108                         spin_unlock(&mp->m_ail->xa_lock);
1109                 error = XFS_ERROR(EIO);
1110                 goto out_unlock;
1111         }
1112
1113         /*
1114          * Get the buffer containing the on-disk dquot
1115          */
1116         error = xfs_trans_read_buf(mp, NULL, mp->m_ddev_targp, dqp->q_blkno,
1117                                    mp->m_quotainfo->qi_dqchunklen, 0, &bp, NULL);
1118         if (error)
1119                 goto out_unlock;
1120
1121         /*
1122          * Calculate the location of the dquot inside the buffer.
1123          */
1124         ddqp = bp->b_addr + dqp->q_bufoffset;
1125
1126         /*
1127          * A simple sanity check in case we got a corrupted dquot..
1128          */
1129         error = xfs_qm_dqcheck(mp, &dqp->q_core, be32_to_cpu(ddqp->d_id), 0,
1130                            XFS_QMOPT_DOWARN, "dqflush (incore copy)");
1131         if (error) {
1132                 xfs_buf_relse(bp);
1133                 xfs_dqfunlock(dqp);
1134                 xfs_force_shutdown(mp, SHUTDOWN_CORRUPT_INCORE);
1135                 return XFS_ERROR(EIO);
1136         }
1137
1138         /* This is the only portion of data that needs to persist */
1139         memcpy(ddqp, &dqp->q_core, sizeof(xfs_disk_dquot_t));
1140
1141         /*
1142          * Clear the dirty field and remember the flush lsn for later use.
1143          */
1144         dqp->dq_flags &= ~XFS_DQ_DIRTY;
1145
1146         xfs_trans_ail_copy_lsn(mp->m_ail, &dqp->q_logitem.qli_flush_lsn,
1147                                         &dqp->q_logitem.qli_item.li_lsn);
1148
1149         /*
1150          * copy the lsn into the on-disk dquot now while we have the in memory
1151          * dquot here. This can't be done later in the write verifier as we
1152          * can't get access to the log item at that point in time.
1153          *
1154          * We also calculate the CRC here so that the on-disk dquot in the
1155          * buffer always has a valid CRC. This ensures there is no possibility
1156          * of a dquot without an up-to-date CRC getting to disk.
1157          */
1158         if (xfs_sb_version_hascrc(&mp->m_sb)) {
1159                 struct xfs_dqblk *dqb = (struct xfs_dqblk *)ddqp;
1160
1161                 dqb->dd_lsn = cpu_to_be64(dqp->q_logitem.qli_item.li_lsn);
1162                 xfs_update_cksum((char *)dqb, sizeof(struct xfs_dqblk),
1163                                  XFS_DQUOT_CRC_OFF);
1164         }
1165
1166         /*
1167          * Attach an iodone routine so that we can remove this dquot from the
1168          * AIL and release the flush lock once the dquot is synced to disk.
1169          */
1170         xfs_buf_attach_iodone(bp, xfs_qm_dqflush_done,
1171                                   &dqp->q_logitem.qli_item);
1172
1173         /*
1174          * If the buffer is pinned then push on the log so we won't
1175          * get stuck waiting in the write for too long.
1176          */
1177         if (xfs_buf_ispinned(bp)) {
1178                 trace_xfs_dqflush_force(dqp);
1179                 xfs_log_force(mp, 0);
1180         }
1181
1182         trace_xfs_dqflush_done(dqp);
1183         *bpp = bp;
1184         return 0;
1185
1186 out_unlock:
1187         xfs_dqfunlock(dqp);
1188         return XFS_ERROR(EIO);
1189 }
1190
1191 /*
1192  * Lock two xfs_dquot structures.
1193  *
1194  * To avoid deadlocks we always lock the quota structure with
1195  * the lowerd id first.
1196  */
1197 void
1198 xfs_dqlock2(
1199         xfs_dquot_t     *d1,
1200         xfs_dquot_t     *d2)
1201 {
1202         if (d1 && d2) {
1203                 ASSERT(d1 != d2);
1204                 if (be32_to_cpu(d1->q_core.d_id) >
1205                     be32_to_cpu(d2->q_core.d_id)) {
1206                         mutex_lock(&d2->q_qlock);
1207                         mutex_lock_nested(&d1->q_qlock, XFS_QLOCK_NESTED);
1208                 } else {
1209                         mutex_lock(&d1->q_qlock);
1210                         mutex_lock_nested(&d2->q_qlock, XFS_QLOCK_NESTED);
1211                 }
1212         } else if (d1) {
1213                 mutex_lock(&d1->q_qlock);
1214         } else if (d2) {
1215                 mutex_lock(&d2->q_qlock);
1216         }
1217 }
1218
1219 int __init
1220 xfs_qm_init(void)
1221 {
1222         xfs_qm_dqzone =
1223                 kmem_zone_init(sizeof(struct xfs_dquot), "xfs_dquot");
1224         if (!xfs_qm_dqzone)
1225                 goto out;
1226
1227         xfs_qm_dqtrxzone =
1228                 kmem_zone_init(sizeof(struct xfs_dquot_acct), "xfs_dqtrx");
1229         if (!xfs_qm_dqtrxzone)
1230                 goto out_free_dqzone;
1231
1232         return 0;
1233
1234 out_free_dqzone:
1235         kmem_zone_destroy(xfs_qm_dqzone);
1236 out:
1237         return -ENOMEM;
1238 }
1239
1240 void
1241 xfs_qm_exit(void)
1242 {
1243         kmem_zone_destroy(xfs_qm_dqtrxzone);
1244         kmem_zone_destroy(xfs_qm_dqzone);
1245 }