fs/gfs2/super.c

   1 /*
   2  * Copyright (C) Sistina Software, Inc.  1997-2003 All rights reserved.
   3  * Copyright (C) 2004-2006 Red Hat, Inc.  All rights reserved.
   4  *
   5  * This copyrighted material is made available to anyone wishing to use,
   6  * modify, copy, or redistribute it subject to the terms and conditions
   7  * of the GNU General Public License version 2.
   8  */
   9
  10 #include <linux/sched.h>
  11 #include <linux/slab.h>
  12 #include <linux/spinlock.h>
  13 #include <linux/completion.h>
  14 #include <linux/buffer_head.h>
  15 #include <linux/crc32.h>
  16 #include <linux/gfs2_ondisk.h>
  17 #include <linux/bio.h>
  18 #include <linux/lm_interface.h>
  19
  20 #include "gfs2.h"
  21 #include "incore.h"
  22 #include "bmap.h"
  23 #include "dir.h"
  24 #include "glock.h"
  25 #include "glops.h"
  26 #include "inode.h"
  27 #include "log.h"
  28 #include "meta_io.h"
  29 #include "quota.h"
  30 #include "recovery.h"
  31 #include "rgrp.h"
  32 #include "super.h"
  33 #include "trans.h"
  34 #include "util.h"
  35
  36 static const u32 gfs2_old_fs_formats[] = {
  37         0
  38 };
  39
  40 static const u32 gfs2_old_multihost_formats[] = {
  41         0
  42 };
  43
  44 /**
  45  * gfs2_tune_init - Fill a gfs2_tune structure with default values
  46  * @gt: tune
  47  *
  48  */
  49
  50 void gfs2_tune_init(struct gfs2_tune *gt)
  51 {
  52         spin_lock_init(&gt->gt_spin);
  53
  54         gt->gt_ilimit = 100;
  55         gt->gt_ilimit_tries = 3;
  56         gt->gt_ilimit_min = 1;
  57         gt->gt_demote_secs = 300;
  58         gt->gt_incore_log_blocks = 1024;
  59         gt->gt_log_flush_secs = 60;
  60         gt->gt_jindex_refresh_secs = 60;
  61         gt->gt_scand_secs = 15;
  62         gt->gt_recoverd_secs = 60;
  63         gt->gt_logd_secs = 1;
  64         gt->gt_quotad_secs = 5;
  65         gt->gt_quota_simul_sync = 64;
  66         gt->gt_quota_warn_period = 10;
  67         gt->gt_quota_scale_num = 1;
  68         gt->gt_quota_scale_den = 1;
  69         gt->gt_quota_cache_secs = 300;
  70         gt->gt_quota_quantum = 60;
  71         gt->gt_atime_quantum = 3600;
  72         gt->gt_new_files_jdata = 0;
  73         gt->gt_new_files_directio = 0;
  74         gt->gt_max_readahead = 1 << 18;
  75         gt->gt_lockdump_size = 131072;
  76         gt->gt_stall_secs = 600;
  77         gt->gt_complain_secs = 10;
  78         gt->gt_reclaim_limit = 5000;
  79         gt->gt_statfs_quantum = 30;
  80         gt->gt_statfs_slow = 0;
  81 }
  82
  83 /**
  84  * gfs2_check_sb - Check superblock
  85  * @sdp: the filesystem
  86  * @sb: The superblock
  87  * @silent: Don't print a message if the check fails
  88  *
  89  * Checks the version code of the FS is one that we understand how to
  90  * read and that the sizes of the various on-disk structures have not
  91  * changed.
  92  */
  93
  94 int gfs2_check_sb(struct gfs2_sbd *sdp, struct gfs2_sb_host *sb, int silent)
  95 {
  96         unsigned int x;
  97
  98         if (sb->sb_header.mh_magic != GFS2_MAGIC ||
  99             sb->sb_header.mh_type != GFS2_METATYPE_SB) {
 100                 if (!silent)
 101                         printk(KERN_WARNING "GFS2: not a GFS2 filesystem\n");
 102                 return -EINVAL;
 103         }
 104
 105         /*  If format numbers match exactly, we're done.  */
 106
 107         if (sb->sb_fs_format == GFS2_FORMAT_FS &&
 108             sb->sb_multihost_format == GFS2_FORMAT_MULTI)
 109                 return 0;
 110
 111         if (sb->sb_fs_format != GFS2_FORMAT_FS) {
 112                 for (x = 0; gfs2_old_fs_formats[x]; x++)
 113                         if (gfs2_old_fs_formats[x] == sb->sb_fs_format)
 114                                 break;
 115
 116                 if (!gfs2_old_fs_formats[x]) {
 117                         printk(KERN_WARNING
 118                                "GFS2: code version (%u, %u) is incompatible "
 119                                "with ondisk format (%u, %u)\n",
 120                                GFS2_FORMAT_FS, GFS2_FORMAT_MULTI,
 121                                sb->sb_fs_format, sb->sb_multihost_format);
 122                         printk(KERN_WARNING
 123                                "GFS2: I don't know how to upgrade this FS\n");
 124                         return -EINVAL;
 125                 }
 126         }
 127
 128         if (sb->sb_multihost_format != GFS2_FORMAT_MULTI) {
 129                 for (x = 0; gfs2_old_multihost_formats[x]; x++)
 130                         if (gfs2_old_multihost_formats[x] ==
 131                             sb->sb_multihost_format)
 132                                 break;
 133
 134                 if (!gfs2_old_multihost_formats[x]) {
 135                         printk(KERN_WARNING
 136                                "GFS2: code version (%u, %u) is incompatible "
 137                                "with ondisk format (%u, %u)\n",
 138                                GFS2_FORMAT_FS, GFS2_FORMAT_MULTI,
 139                                sb->sb_fs_format, sb->sb_multihost_format);
 140                         printk(KERN_WARNING
 141                                "GFS2: I don't know how to upgrade this FS\n");
 142                         return -EINVAL;
 143                 }
 144         }
 145
 146         if (!sdp->sd_args.ar_upgrade) {
 147                 printk(KERN_WARNING
 148                        "GFS2: code version (%u, %u) is incompatible "
 149                        "with ondisk format (%u, %u)\n",
 150                        GFS2_FORMAT_FS, GFS2_FORMAT_MULTI,
 151                        sb->sb_fs_format, sb->sb_multihost_format);
 152                 printk(KERN_INFO
 153                        "GFS2: Use the \"upgrade\" mount option to upgrade "
 154                        "the FS\n");
 155                 printk(KERN_INFO "GFS2: See the manual for more details\n");
 156                 return -EINVAL;
 157         }
 158
 159         return 0;
 160 }
 161
 162
 163 static int end_bio_io_page(struct bio *bio, unsigned int bytes_done, int error)
 164 {
 165         struct page *page = bio->bi_private;
 166         if (bio->bi_size)
 167                 return 1;
 168
 169         if (!error)
 170                 SetPageUptodate(page);
 171         else
 172                 printk(KERN_WARNING "gfs2: error %d reading superblock\n", error);
 173         unlock_page(page);
 174         return 0;
 175 }
 176
 177 /**
 178  * gfs2_read_super - Read the gfs2 super block from disk
 179  * @sb: The VFS super block
 180  * @sector: The location of the super block
 181  *
 182  * This uses the bio functions to read the super block from disk
 183  * because we want to be 100% sure that we never read cached data.
 184  * A super block is read twice only during each GFS2 mount and is
 185  * never written to by the filesystem. The first time its read no
 186  * locks are held, and the only details which are looked at are those
 187  * relating to the locking protocol. Once locking is up and working,
 188  * the sb is read again under the lock to establish the location of
 189  * the master directory (contains pointers to journals etc) and the
 190  * root directory.
 191  *
 192  * Returns: A page containing the sb or NULL
 193  */
 194
 195 struct page *gfs2_read_super(struct super_block *sb, sector_t sector)
 196 {
 197         struct page *page;
 198         struct bio *bio;
 199
 200         page = alloc_page(GFP_KERNEL);
 201         if (unlikely(!page))
 202                 return NULL;
 203
 204         ClearPageUptodate(page);
 205         ClearPageDirty(page);
 206         lock_page(page);
 207
 208         bio = bio_alloc(GFP_KERNEL, 1);
 209         if (unlikely(!bio)) {
 210                 __free_page(page);
 211                 return NULL;
 212         }
 213
 214         bio->bi_sector = sector * (sb->s_blocksize >> 9);
 215         bio->bi_bdev = sb->s_bdev;
 216         bio_add_page(bio, page, PAGE_SIZE, 0);
 217
 218         bio->bi_end_io = end_bio_io_page;
 219         bio->bi_private = page;
 220         submit_bio(READ_SYNC | (1 << BIO_RW_META), bio);
 221         wait_on_page_locked(page);
 222         bio_put(bio);
 223         if (!PageUptodate(page)) {
 224                 __free_page(page);
 225                 return NULL;
 226         }
 227         return page;
 228 }
 229
 230 /**
 231  * gfs2_read_sb - Read super block
 232  * @sdp: The GFS2 superblock
 233  * @gl: the glock for the superblock (assumed to be held)
 234  * @silent: Don't print message if mount fails
 235  *
 236  */
 237
 238 int gfs2_read_sb(struct gfs2_sbd *sdp, struct gfs2_glock *gl, int silent)
 239 {
 240         u32 hash_blocks, ind_blocks, leaf_blocks;
 241         u32 tmp_blocks;
 242         unsigned int x;
 243         int error;
 244         struct page *page;
 245         char *sb;
 246
 247         page = gfs2_read_super(sdp->sd_vfs, GFS2_SB_ADDR >> sdp->sd_fsb2bb_shift);
 248         if (!page) {
 249                 if (!silent)
 250                         fs_err(sdp, "can't read superblock\n");
 251                 return -EIO;
 252         }
 253         sb = kmap(page);
 254         gfs2_sb_in(&sdp->sd_sb, sb);
 255         kunmap(page);
 256         __free_page(page);
 257
 258         error = gfs2_check_sb(sdp, &sdp->sd_sb, silent);
 259         if (error)
 260                 return error;
 261
 262         sdp->sd_fsb2bb_shift = sdp->sd_sb.sb_bsize_shift -
 263                                GFS2_BASIC_BLOCK_SHIFT;
 264         sdp->sd_fsb2bb = 1 << sdp->sd_fsb2bb_shift;
 265         sdp->sd_diptrs = (sdp->sd_sb.sb_bsize -
 266                           sizeof(struct gfs2_dinode)) / sizeof(u64);
 267         sdp->sd_inptrs = (sdp->sd_sb.sb_bsize -
 268                           sizeof(struct gfs2_meta_header)) / sizeof(u64);
 269         sdp->sd_jbsize = sdp->sd_sb.sb_bsize - sizeof(struct gfs2_meta_header);
 270         sdp->sd_hash_bsize = sdp->sd_sb.sb_bsize / 2;
 271         sdp->sd_hash_bsize_shift = sdp->sd_sb.sb_bsize_shift - 1;
 272         sdp->sd_hash_ptrs = sdp->sd_hash_bsize / sizeof(u64);
 273         sdp->sd_qc_per_block = (sdp->sd_sb.sb_bsize -
 274                                 sizeof(struct gfs2_meta_header)) /
 275                                 sizeof(struct gfs2_quota_change);
 276
 277         /* Compute maximum reservation required to add a entry to a directory */
 278
 279         hash_blocks = DIV_ROUND_UP(sizeof(u64) * (1 << GFS2_DIR_MAX_DEPTH),
 280                              sdp->sd_jbsize);
 281
 282         ind_blocks = 0;
 283         for (tmp_blocks = hash_blocks; tmp_blocks > sdp->sd_diptrs;) {
 284                 tmp_blocks = DIV_ROUND_UP(tmp_blocks, sdp->sd_inptrs);
 285                 ind_blocks += tmp_blocks;
 286         }
 287
 288         leaf_blocks = 2 + GFS2_DIR_MAX_DEPTH;
 289
 290         sdp->sd_max_dirres = hash_blocks + ind_blocks + leaf_blocks;
 291
 292         sdp->sd_heightsize[0] = sdp->sd_sb.sb_bsize -
 293                                 sizeof(struct gfs2_dinode);
 294         sdp->sd_heightsize[1] = sdp->sd_sb.sb_bsize * sdp->sd_diptrs;
 295         for (x = 2;; x++) {
 296                 u64 space, d;
 297                 u32 m;
 298
 299                 space = sdp->sd_heightsize[x - 1] * sdp->sd_inptrs;
 300                 d = space;
 301                 m = do_div(d, sdp->sd_inptrs);
 302
 303                 if (d != sdp->sd_heightsize[x - 1] || m)
 304                         break;
 305                 sdp->sd_heightsize[x] = space;
 306         }
 307         sdp->sd_max_height = x;
 308         gfs2_assert(sdp, sdp->sd_max_height <= GFS2_MAX_META_HEIGHT);
 309
 310         sdp->sd_jheightsize[0] = sdp->sd_sb.sb_bsize -
 311                                  sizeof(struct gfs2_dinode);
 312         sdp->sd_jheightsize[1] = sdp->sd_jbsize * sdp->sd_diptrs;
 313         for (x = 2;; x++) {
 314                 u64 space, d;
 315                 u32 m;
 316
 317                 space = sdp->sd_jheightsize[x - 1] * sdp->sd_inptrs;
 318                 d = space;
 319                 m = do_div(d, sdp->sd_inptrs);
 320
 321                 if (d != sdp->sd_jheightsize[x - 1] || m)
 322                         break;
 323                 sdp->sd_jheightsize[x] = space;
 324         }
 325         sdp->sd_max_jheight = x;
 326         gfs2_assert(sdp, sdp->sd_max_jheight <= GFS2_MAX_META_HEIGHT);
 327
 328         return 0;
 329 }
 330
 331 /**
 332  * gfs2_jindex_hold - Grab a lock on the jindex
 333  * @sdp: The GFS2 superblock
 334  * @ji_gh: the holder for the jindex glock
 335  *
 336  * This is very similar to the gfs2_rindex_hold() function, except that
 337  * in general we hold the jindex lock for longer periods of time and
 338  * we grab it far less frequently (in general) then the rgrp lock.
 339  *
 340  * Returns: errno
 341  */
 342
 343 int gfs2_jindex_hold(struct gfs2_sbd *sdp, struct gfs2_holder *ji_gh)
 344 {
 345         struct gfs2_inode *dip = GFS2_I(sdp->sd_jindex);
 346         struct qstr name;
 347         char buf[20];
 348         struct gfs2_jdesc *jd;
 349         int error;
 350
 351         name.name = buf;
 352
 353         mutex_lock(&sdp->sd_jindex_mutex);
 354
 355         for (;;) {
 356                 error = gfs2_glock_nq_init(dip->i_gl, LM_ST_SHARED, 0, ji_gh);
 357                 if (error)
 358                         break;
 359
 360                 name.len = sprintf(buf, "journal%u", sdp->sd_journals);
 361                 name.hash = gfs2_disk_hash(name.name, name.len);
 362
 363                 error = gfs2_dir_search(sdp->sd_jindex, &name, NULL, NULL);
 364                 if (error == -ENOENT) {
 365                         error = 0;
 366                         break;
 367                 }
 368
 369                 gfs2_glock_dq_uninit(ji_gh);
 370
 371                 if (error)
 372                         break;
 373
 374                 error = -ENOMEM;
 375                 jd = kzalloc(sizeof(struct gfs2_jdesc), GFP_KERNEL);
 376                 if (!jd)
 377                         break;
 378
 379                 jd->jd_inode = gfs2_lookupi(sdp->sd_jindex, &name, 1, NULL);
 380                 if (!jd->jd_inode || IS_ERR(jd->jd_inode)) {
 381                         if (!jd->jd_inode)
 382                                 error = -ENOENT;
 383                         else
 384                                 error = PTR_ERR(jd->jd_inode);
 385                         kfree(jd);
 386                         break;
 387                 }
 388
 389                 spin_lock(&sdp->sd_jindex_spin);
 390                 jd->jd_jid = sdp->sd_journals++;
 391                 list_add_tail(&jd->jd_list, &sdp->sd_jindex_list);
 392                 spin_unlock(&sdp->sd_jindex_spin);
 393         }
 394
 395         mutex_unlock(&sdp->sd_jindex_mutex);
 396
 397         return error;
 398 }
 399
 400 /**
 401  * gfs2_jindex_free - Clear all the journal index information
 402  * @sdp: The GFS2 superblock
 403  *
 404  */
 405
 406 void gfs2_jindex_free(struct gfs2_sbd *sdp)
 407 {
 408         struct list_head list;
 409         struct gfs2_jdesc *jd;
 410
 411         spin_lock(&sdp->sd_jindex_spin);
 412         list_add(&list, &sdp->sd_jindex_list);
 413         list_del_init(&sdp->sd_jindex_list);
 414         sdp->sd_journals = 0;
 415         spin_unlock(&sdp->sd_jindex_spin);
 416
 417         while (!list_empty(&list)) {
 418                 jd = list_entry(list.next, struct gfs2_jdesc, jd_list);
 419                 list_del(&jd->jd_list);
 420                 iput(jd->jd_inode);
 421                 kfree(jd);
 422         }
 423 }
 424
 425 static struct gfs2_jdesc *jdesc_find_i(struct list_head *head, unsigned int jid)
 426 {
 427         struct gfs2_jdesc *jd;
 428         int found = 0;
 429
 430         list_for_each_entry(jd, head, jd_list) {
 431                 if (jd->jd_jid == jid) {
 432                         found = 1;
 433                         break;
 434                 }
 435         }
 436
 437         if (!found)
 438                 jd = NULL;
 439
 440         return jd;
 441 }
 442
 443 struct gfs2_jdesc *gfs2_jdesc_find(struct gfs2_sbd *sdp, unsigned int jid)
 444 {
 445         struct gfs2_jdesc *jd;
 446
 447         spin_lock(&sdp->sd_jindex_spin);
 448         jd = jdesc_find_i(&sdp->sd_jindex_list, jid);
 449         spin_unlock(&sdp->sd_jindex_spin);
 450
 451         return jd;
 452 }
 453
 454 void gfs2_jdesc_make_dirty(struct gfs2_sbd *sdp, unsigned int jid)
 455 {
 456         struct gfs2_jdesc *jd;
 457
 458         spin_lock(&sdp->sd_jindex_spin);
 459         jd = jdesc_find_i(&sdp->sd_jindex_list, jid);
 460         if (jd)
 461                 jd->jd_dirty = 1;
 462         spin_unlock(&sdp->sd_jindex_spin);
 463 }
 464
 465 struct gfs2_jdesc *gfs2_jdesc_find_dirty(struct gfs2_sbd *sdp)
 466 {
 467         struct gfs2_jdesc *jd;
 468         int found = 0;
 469
 470         spin_lock(&sdp->sd_jindex_spin);
 471
 472         list_for_each_entry(jd, &sdp->sd_jindex_list, jd_list) {
 473                 if (jd->jd_dirty) {
 474                         jd->jd_dirty = 0;
 475                         found = 1;
 476                         break;
 477                 }
 478         }
 479         spin_unlock(&sdp->sd_jindex_spin);
 480
 481         if (!found)
 482                 jd = NULL;
 483
 484         return jd;
 485 }
 486
 487 int gfs2_jdesc_check(struct gfs2_jdesc *jd)
 488 {
 489         struct gfs2_inode *ip = GFS2_I(jd->jd_inode);
 490         struct gfs2_sbd *sdp = GFS2_SB(jd->jd_inode);
 491         int ar;
 492         int error;
 493
 494         if (ip->i_di.di_size < (8 << 20) || ip->i_di.di_size > (1 << 30) ||
 495             (ip->i_di.di_size & (sdp->sd_sb.sb_bsize - 1))) {
 496                 gfs2_consist_inode(ip);
 497                 return -EIO;
 498         }
 499         jd->jd_blocks = ip->i_di.di_size >> sdp->sd_sb.sb_bsize_shift;
 500
 501         error = gfs2_write_alloc_required(ip, 0, ip->i_di.di_size, &ar);
 502         if (!error && ar) {
 503                 gfs2_consist_inode(ip);
 504                 error = -EIO;
 505         }
 506
 507         return error;
 508 }
 509
 510 /**
 511  * gfs2_make_fs_rw - Turn a Read-Only FS into a Read-Write one
 512  * @sdp: the filesystem
 513  *
 514  * Returns: errno
 515  */
 516
 517 int gfs2_make_fs_rw(struct gfs2_sbd *sdp)
 518 {
 519         struct gfs2_inode *ip = GFS2_I(sdp->sd_jdesc->jd_inode);
 520         struct gfs2_glock *j_gl = ip->i_gl;
 521         struct gfs2_holder t_gh;
 522         struct gfs2_log_header_host head;
 523         int error;
 524
 525         error = gfs2_glock_nq_init(sdp->sd_trans_gl, LM_ST_SHARED, 0, &t_gh);
 526         if (error)
 527                 return error;
 528
 529         gfs2_meta_cache_flush(ip);
 530         j_gl->gl_ops->go_inval(j_gl, DIO_METADATA);
 531
 532         error = gfs2_find_jhead(sdp->sd_jdesc, &head);
 533         if (error)
 534                 goto fail;
 535
 536         if (!(head.lh_flags & GFS2_LOG_HEAD_UNMOUNT)) {
 537                 gfs2_consist(sdp);
 538                 error = -EIO;
 539                 goto fail;
 540         }
 541
 542         /*  Initialize some head of the log stuff  */
 543         sdp->sd_log_sequence = head.lh_sequence + 1;
 544         gfs2_log_pointers_init(sdp, head.lh_blkno);
 545
 546         error = gfs2_quota_init(sdp);
 547         if (error)
 548                 goto fail;
 549
 550         set_bit(SDF_JOURNAL_LIVE, &sdp->sd_flags);
 551
 552         gfs2_glock_dq_uninit(&t_gh);
 553
 554         return 0;
 555
 556 fail:
 557         t_gh.gh_flags |= GL_NOCACHE;
 558         gfs2_glock_dq_uninit(&t_gh);
 559
 560         return error;
 561 }
 562
 563 /**
 564  * gfs2_make_fs_ro - Turn a Read-Write FS into a Read-Only one
 565  * @sdp: the filesystem
 566  *
 567  * Returns: errno
 568  */
 569
 570 int gfs2_make_fs_ro(struct gfs2_sbd *sdp)
 571 {
 572         struct gfs2_holder t_gh;
 573         int error;
 574
 575         gfs2_quota_sync(sdp);
 576         gfs2_statfs_sync(sdp);
 577
 578         error = gfs2_glock_nq_init(sdp->sd_trans_gl, LM_ST_SHARED, GL_NOCACHE,
 579                                    &t_gh);
 580         if (error && !test_bit(SDF_SHUTDOWN, &sdp->sd_flags))
 581                 return error;
 582
 583         gfs2_meta_syncfs(sdp);
 584         gfs2_log_shutdown(sdp);
 585
 586         clear_bit(SDF_JOURNAL_LIVE, &sdp->sd_flags);
 587
 588         if (t_gh.gh_gl)
 589                 gfs2_glock_dq_uninit(&t_gh);
 590
 591         gfs2_quota_cleanup(sdp);
 592
 593         return error;
 594 }
 595
 596 int gfs2_statfs_init(struct gfs2_sbd *sdp)
 597 {
 598         struct gfs2_inode *m_ip = GFS2_I(sdp->sd_statfs_inode);
 599         struct gfs2_statfs_change_host *m_sc = &sdp->sd_statfs_master;
 600         struct gfs2_inode *l_ip = GFS2_I(sdp->sd_sc_inode);
 601         struct gfs2_statfs_change_host *l_sc = &sdp->sd_statfs_local;
 602         struct buffer_head *m_bh, *l_bh;
 603         struct gfs2_holder gh;
 604         int error;
 605
 606         error = gfs2_glock_nq_init(m_ip->i_gl, LM_ST_EXCLUSIVE, GL_NOCACHE,
 607                                    &gh);
 608         if (error)
 609                 return error;
 610
 611         error = gfs2_meta_inode_buffer(m_ip, &m_bh);
 612         if (error)
 613                 goto out;
 614
 615         if (sdp->sd_args.ar_spectator) {
 616                 spin_lock(&sdp->sd_statfs_spin);
 617                 gfs2_statfs_change_in(m_sc, m_bh->b_data +
 618                                       sizeof(struct gfs2_dinode));
 619                 spin_unlock(&sdp->sd_statfs_spin);
 620         } else {
 621                 error = gfs2_meta_inode_buffer(l_ip, &l_bh);
 622                 if (error)
 623                         goto out_m_bh;
 624
 625                 spin_lock(&sdp->sd_statfs_spin);
 626                 gfs2_statfs_change_in(m_sc, m_bh->b_data +
 627                                       sizeof(struct gfs2_dinode));
 628                 gfs2_statfs_change_in(l_sc, l_bh->b_data +
 629                                       sizeof(struct gfs2_dinode));
 630                 spin_unlock(&sdp->sd_statfs_spin);
 631
 632                 brelse(l_bh);
 633         }
 634
 635 out_m_bh:
 636         brelse(m_bh);
 637 out:
 638         gfs2_glock_dq_uninit(&gh);
 639         return 0;
 640 }
 641
 642 void gfs2_statfs_change(struct gfs2_sbd *sdp, s64 total, s64 free,
 643                         s64 dinodes)
 644 {
 645         struct gfs2_inode *l_ip = GFS2_I(sdp->sd_sc_inode);
 646         struct gfs2_statfs_change_host *l_sc = &sdp->sd_statfs_local;
 647         struct buffer_head *l_bh;
 648         int error;
 649
 650         error = gfs2_meta_inode_buffer(l_ip, &l_bh);
 651         if (error)
 652                 return;
 653
 654         mutex_lock(&sdp->sd_statfs_mutex);
 655         gfs2_trans_add_bh(l_ip->i_gl, l_bh, 1);
 656         mutex_unlock(&sdp->sd_statfs_mutex);
 657
 658         spin_lock(&sdp->sd_statfs_spin);
 659         l_sc->sc_total += total;
 660         l_sc->sc_free += free;
 661         l_sc->sc_dinodes += dinodes;
 662         gfs2_statfs_change_out(l_sc, l_bh->b_data + sizeof(struct gfs2_dinode));
 663         spin_unlock(&sdp->sd_statfs_spin);
 664
 665         brelse(l_bh);
 666 }
 667
 668 int gfs2_statfs_sync(struct gfs2_sbd *sdp)
 669 {
 670         struct gfs2_inode *m_ip = GFS2_I(sdp->sd_statfs_inode);
 671         struct gfs2_inode *l_ip = GFS2_I(sdp->sd_sc_inode);
 672         struct gfs2_statfs_change_host *m_sc = &sdp->sd_statfs_master;
 673         struct gfs2_statfs_change_host *l_sc = &sdp->sd_statfs_local;
 674         struct gfs2_holder gh;
 675         struct buffer_head *m_bh, *l_bh;
 676         int error;
 677
 678         error = gfs2_glock_nq_init(m_ip->i_gl, LM_ST_EXCLUSIVE, GL_NOCACHE,
 679                                    &gh);
 680         if (error)
 681                 return error;
 682
 683         error = gfs2_meta_inode_buffer(m_ip, &m_bh);
 684         if (error)
 685                 goto out;
 686
 687         spin_lock(&sdp->sd_statfs_spin);
 688         gfs2_statfs_change_in(m_sc, m_bh->b_data +
 689                               sizeof(struct gfs2_dinode));
 690         if (!l_sc->sc_total && !l_sc->sc_free && !l_sc->sc_dinodes) {
 691                 spin_unlock(&sdp->sd_statfs_spin);
 692                 goto out_bh;
 693         }
 694         spin_unlock(&sdp->sd_statfs_spin);
 695
 696         error = gfs2_meta_inode_buffer(l_ip, &l_bh);
 697         if (error)
 698                 goto out_bh;
 699
 700         error = gfs2_trans_begin(sdp, 2 * RES_DINODE, 0);
 701         if (error)
 702                 goto out_bh2;
 703
 704         mutex_lock(&sdp->sd_statfs_mutex);
 705         gfs2_trans_add_bh(l_ip->i_gl, l_bh, 1);
 706         mutex_unlock(&sdp->sd_statfs_mutex);
 707
 708         spin_lock(&sdp->sd_statfs_spin);
 709         m_sc->sc_total += l_sc->sc_total;
 710         m_sc->sc_free += l_sc->sc_free;
 711         m_sc->sc_dinodes += l_sc->sc_dinodes;
 712         memset(l_sc, 0, sizeof(struct gfs2_statfs_change));
 713         memset(l_bh->b_data + sizeof(struct gfs2_dinode),
 714                0, sizeof(struct gfs2_statfs_change));
 715         spin_unlock(&sdp->sd_statfs_spin);
 716
 717         gfs2_trans_add_bh(m_ip->i_gl, m_bh, 1);
 718         gfs2_statfs_change_out(m_sc, m_bh->b_data + sizeof(struct gfs2_dinode));
 719
 720         gfs2_trans_end(sdp);
 721
 722 out_bh2:
 723         brelse(l_bh);
 724 out_bh:
 725         brelse(m_bh);
 726 out:
 727         gfs2_glock_dq_uninit(&gh);
 728         return error;
 729 }
 730
 731 /**
 732  * gfs2_statfs_i - Do a statfs
 733  * @sdp: the filesystem
 734  * @sg: the sg structure
 735  *
 736  * Returns: errno
 737  */
 738
 739 int gfs2_statfs_i(struct gfs2_sbd *sdp, struct gfs2_statfs_change_host *sc)
 740 {
 741         struct gfs2_statfs_change_host *m_sc = &sdp->sd_statfs_master;
 742         struct gfs2_statfs_change_host *l_sc = &sdp->sd_statfs_local;
 743
 744         spin_lock(&sdp->sd_statfs_spin);
 745
 746         *sc = *m_sc;
 747         sc->sc_total += l_sc->sc_total;
 748         sc->sc_free += l_sc->sc_free;
 749         sc->sc_dinodes += l_sc->sc_dinodes;
 750
 751         spin_unlock(&sdp->sd_statfs_spin);
 752
 753         if (sc->sc_free < 0)
 754                 sc->sc_free = 0;
 755         if (sc->sc_free > sc->sc_total)
 756                 sc->sc_free = sc->sc_total;
 757         if (sc->sc_dinodes < 0)
 758                 sc->sc_dinodes = 0;
 759
 760         return 0;
 761 }
 762
 763 /**
 764  * statfs_fill - fill in the sg for a given RG
 765  * @rgd: the RG
 766  * @sc: the sc structure
 767  *
 768  * Returns: 0 on success, -ESTALE if the LVB is invalid
 769  */
 770
 771 static int statfs_slow_fill(struct gfs2_rgrpd *rgd,
 772                             struct gfs2_statfs_change_host *sc)
 773 {
 774         gfs2_rgrp_verify(rgd);
 775         sc->sc_total += rgd->rd_ri.ri_data;
 776         sc->sc_free += rgd->rd_rg.rg_free;
 777         sc->sc_dinodes += rgd->rd_rg.rg_dinodes;
 778         return 0;
 779 }
 780
 781 /**
 782  * gfs2_statfs_slow - Stat a filesystem using asynchronous locking
 783  * @sdp: the filesystem
 784  * @sc: the sc info that will be returned
 785  *
 786  * Any error (other than a signal) will cause this routine to fall back
 787  * to the synchronous version.
 788  *
 789  * FIXME: This really shouldn't busy wait like this.
 790  *
 791  * Returns: errno
 792  */
 793
 794 int gfs2_statfs_slow(struct gfs2_sbd *sdp, struct gfs2_statfs_change_host *sc)
 795 {
 796         struct gfs2_holder ri_gh;
 797         struct gfs2_rgrpd *rgd_next;
 798         struct gfs2_holder *gha, *gh;
 799         unsigned int slots = 64;
 800         unsigned int x;
 801         int done;
 802         int error = 0, err;
 803
 804         memset(sc, 0, sizeof(struct gfs2_statfs_change_host));
 805         gha = kcalloc(slots, sizeof(struct gfs2_holder), GFP_KERNEL);
 806         if (!gha)
 807                 return -ENOMEM;
 808
 809         error = gfs2_rindex_hold(sdp, &ri_gh);
 810         if (error)
 811                 goto out;
 812
 813         rgd_next = gfs2_rgrpd_get_first(sdp);
 814
 815         for (;;) {
 816                 done = 1;
 817
 818                 for (x = 0; x < slots; x++) {
 819                         gh = gha + x;
 820
 821                         if (gh->gh_gl && gfs2_glock_poll(gh)) {
 822                                 err = gfs2_glock_wait(gh);
 823                                 if (err) {
 824                                         gfs2_holder_uninit(gh);
 825                                         error = err;
 826                                 } else {
 827                                         if (!error)
 828                                                 error = statfs_slow_fill(
 829                                                         gh->gh_gl->gl_object, sc);
 830                                         gfs2_glock_dq_uninit(gh);
 831                                 }
 832                         }
 833
 834                         if (gh->gh_gl)
 835                                 done = 0;
 836                         else if (rgd_next && !error) {
 837                                 error = gfs2_glock_nq_init(rgd_next->rd_gl,
 838                                                            LM_ST_SHARED,
 839                                                            GL_ASYNC,
 840                                                            gh);
 841                                 rgd_next = gfs2_rgrpd_get_next(rgd_next);
 842                                 done = 0;
 843                         }
 844
 845                         if (signal_pending(current))
 846                                 error = -ERESTARTSYS;
 847                 }
 848
 849                 if (done)
 850                         break;
 851
 852                 yield();
 853         }
 854
 855         gfs2_glock_dq_uninit(&ri_gh);
 856
 857 out:
 858         kfree(gha);
 859         return error;
 860 }
 861
 862 struct lfcc {
 863         struct list_head list;
 864         struct gfs2_holder gh;
 865 };
 866
 867 /**
 868  * gfs2_lock_fs_check_clean - Stop all writes to the FS and check that all
 869  *                            journals are clean
 870  * @sdp: the file system
 871  * @state: the state to put the transaction lock into
 872  * @t_gh: the hold on the transaction lock
 873  *
 874  * Returns: errno
 875  */
 876
 877 static int gfs2_lock_fs_check_clean(struct gfs2_sbd *sdp,
 878                                     struct gfs2_holder *t_gh)
 879 {
 880         struct gfs2_inode *ip;
 881         struct gfs2_holder ji_gh;
 882         struct gfs2_jdesc *jd;
 883         struct lfcc *lfcc;
 884         LIST_HEAD(list);
 885         struct gfs2_log_header_host lh;
 886         int error;
 887
 888         error = gfs2_jindex_hold(sdp, &ji_gh);
 889         if (error)
 890                 return error;
 891
 892         list_for_each_entry(jd, &sdp->sd_jindex_list, jd_list) {
 893                 lfcc = kmalloc(sizeof(struct lfcc), GFP_KERNEL);
 894                 if (!lfcc) {
 895                         error = -ENOMEM;
 896                         goto out;
 897                 }
 898                 ip = GFS2_I(jd->jd_inode);
 899                 error = gfs2_glock_nq_init(ip->i_gl, LM_ST_SHARED, 0, &lfcc->gh);
 900                 if (error) {
 901                         kfree(lfcc);
 902                         goto out;
 903                 }
 904                 list_add(&lfcc->list, &list);
 905         }
 906
 907         error = gfs2_glock_nq_init(sdp->sd_trans_gl, LM_ST_DEFERRED,
 908                                LM_FLAG_PRIORITY | GL_NOCACHE,
 909                                t_gh);
 910
 911         list_for_each_entry(jd, &sdp->sd_jindex_list, jd_list) {
 912                 error = gfs2_jdesc_check(jd);
 913                 if (error)
 914                         break;
 915                 error = gfs2_find_jhead(jd, &lh);
 916                 if (error)
 917                         break;
 918                 if (!(lh.lh_flags & GFS2_LOG_HEAD_UNMOUNT)) {
 919                         error = -EBUSY;
 920                         break;
 921                 }
 922         }
 923
 924         if (error)
 925                 gfs2_glock_dq_uninit(t_gh);
 926
 927 out:
 928         while (!list_empty(&list)) {
 929                 lfcc = list_entry(list.next, struct lfcc, list);
 930                 list_del(&lfcc->list);
 931                 gfs2_glock_dq_uninit(&lfcc->gh);
 932                 kfree(lfcc);
 933         }
 934         gfs2_glock_dq_uninit(&ji_gh);
 935         return error;
 936 }
 937
 938 /**
 939  * gfs2_freeze_fs - freezes the file system
 940  * @sdp: the file system
 941  *
 942  * This function flushes data and meta data for all machines by
 943  * aquiring the transaction log exclusively.  All journals are
 944  * ensured to be in a clean state as well.
 945  *
 946  * Returns: errno
 947  */
 948
 949 int gfs2_freeze_fs(struct gfs2_sbd *sdp)
 950 {
 951         int error = 0;
 952
 953         mutex_lock(&sdp->sd_freeze_lock);
 954
 955         if (!sdp->sd_freeze_count++) {
 956                 error = gfs2_lock_fs_check_clean(sdp, &sdp->sd_freeze_gh);
 957                 if (error)
 958                         sdp->sd_freeze_count--;
 959         }
 960
 961         mutex_unlock(&sdp->sd_freeze_lock);
 962
 963         return error;
 964 }
 965
 966 /**
 967  * gfs2_unfreeze_fs - unfreezes the file system
 968  * @sdp: the file system
 969  *
 970  * This function allows the file system to proceed by unlocking
 971  * the exclusively held transaction lock.  Other GFS2 nodes are
 972  * now free to acquire the lock shared and go on with their lives.
 973  *
 974  */
 975
 976 void gfs2_unfreeze_fs(struct gfs2_sbd *sdp)
 977 {
 978         mutex_lock(&sdp->sd_freeze_lock);
 979
 980         if (sdp->sd_freeze_count && !--sdp->sd_freeze_count)
 981                 gfs2_glock_dq_uninit(&sdp->sd_freeze_gh);
 982
 983         mutex_unlock(&sdp->sd_freeze_lock);
 984 }
 985