fedora core 6 1.2949 + vserver 2.2.0

[linux-2.6.git] / fs / ntfs / mft.c
diff --git a/fs/ntfs/mft.c b/fs/ntfs/mft.c

index 6499aaf..2ad5c8b 100644 (file)
--- a/fs/ntfs/mft.c
+++ b/fs/ntfs/mft.c
@@ -93,6 +93,7 @@ static inline MFT_RECORD *map_mft_record_page(ntfs_inode *ni)
                                 "Run chkdsk.", ni->mft_no);
                 ntfs_unmap_page(page);
                 page = ERR_PTR(-EIO);
+               NVolSetErrors(vol);
         }
  err_out:
         ni->page = NULL;
@@ -104,8 +105,8 @@ err_out:
   * map_mft_record - map, pin and lock an mft record
   * @ni:                ntfs inode whose MFT record to map
   *
- * First, take the mrec_lock semaphore. We might now be sleeping, while waiting
- * for the semaphore if it was already locked by someone else.
+ * First, take the mrec_lock mutex.  We might now be sleeping, while waiting
+ * for the mutex if it was already locked by someone else.
   *
   * The page of the record is mapped using map_mft_record_page() before being
   * returned to the caller.
@@ -135,9 +136,9 @@ err_out:
   * So that code will end up having to own the mrec_lock of all mft
   * records/inodes present in the page before I/O can proceed. In that case we
   * wouldn't need to bother with PG_locked and PG_uptodate as nobody will be
- * accessing anything without owning the mrec_lock semaphore. But we do need
- * to use them because of the read_cache_page() invocation and the code becomes
- * so much simpler this way that it is well worth it.
+ * accessing anything without owning the mrec_lock mutex.  But we do need to
+ * use them because of the read_cache_page() invocation and the code becomes so
+ * much simpler this way that it is well worth it.
   *
   * The mft record is now ours and we return a pointer to it. You need to check
   * the returned pointer with IS_ERR() and if that is true, PTR_ERR() will return
@@ -160,13 +161,13 @@ MFT_RECORD *map_mft_record(ntfs_inode *ni)
         atomic_inc(&ni->count);
  
         /* Serialize access to this mft record. */
-       down(&ni->mrec_lock);
+       mutex_lock(&ni->mrec_lock);
  
         m = map_mft_record_page(ni);
         if (likely(!IS_ERR(m)))
                 return m;
  
-       up(&ni->mrec_lock);
+       mutex_unlock(&ni->mrec_lock);
         atomic_dec(&ni->count);
         ntfs_error(ni->vol->sb, "Failed with error code %lu.", -PTR_ERR(m));
         return m;
@@ -217,7 +218,7 @@ void unmap_mft_record(ntfs_inode *ni)
         ntfs_debug("Entering for mft_no 0x%lx.", ni->mft_no);
  
         unmap_mft_record_page(ni);
-       up(&ni->mrec_lock);
+       mutex_unlock(&ni->mrec_lock);
         atomic_dec(&ni->count);
         /*
          * If pure ntfs_inode, i.e. no vfs inode attached, we leave it to
@@ -250,7 +251,7 @@ MFT_RECORD *map_extent_mft_record(ntfs_inode *base_ni, MFT_REF mref,
         int i;
         unsigned long mft_no = MREF(mref);
         u16 seq_no = MSEQNO(mref);
-       BOOL destroy_ni = FALSE;
+       bool destroy_ni = false;
  
         ntfs_debug("Mapping extent mft record 0x%lx (base mft record 0x%lx).",
                         mft_no, base_ni->mft_no);
@@ -261,7 +262,7 @@ MFT_RECORD *map_extent_mft_record(ntfs_inode *base_ni, MFT_REF mref,
          * in which case just return it. If not found, add it to the base
          * inode before returning it.
          */
-       down(&base_ni->extent_lock);
+       mutex_lock(&base_ni->extent_lock);
         if (base_ni->nr_extents > 0) {
                 extent_nis = base_ni->ext.extent_ntfs_inos;
                 for (i = 0; i < base_ni->nr_extents; i++) {
@@ -274,7 +275,7 @@ MFT_RECORD *map_extent_mft_record(ntfs_inode *base_ni, MFT_REF mref,
                 }
         }
         if (likely(ni != NULL)) {
-               up(&base_ni->extent_lock);
+               mutex_unlock(&base_ni->extent_lock);
                 atomic_dec(&base_ni->count);
                 /* We found the record; just have to map and return it. */
                 m = map_mft_record(ni);
@@ -301,7 +302,7 @@ map_err_out:
         /* Record wasn't there. Get a new ntfs inode and initialize it. */
         ni = ntfs_new_extent_inode(base_ni->vol->sb, mft_no);
         if (unlikely(!ni)) {
-               up(&base_ni->extent_lock);
+               mutex_unlock(&base_ni->extent_lock);
                 atomic_dec(&base_ni->count);
                 return ERR_PTR(-ENOMEM);
         }
@@ -312,7 +313,7 @@ map_err_out:
         /* Now map the record. */
         m = map_mft_record(ni);
         if (IS_ERR(m)) {
-               up(&base_ni->extent_lock);
+               mutex_unlock(&base_ni->extent_lock);
                 atomic_dec(&base_ni->count);
                 ntfs_clear_extent_inode(ni);
                 goto map_err_out;
@@ -321,7 +322,7 @@ map_err_out:
         if (seq_no && (le16_to_cpu(m->sequence_number) != seq_no)) {
                 ntfs_error(base_ni->vol->sb, "Found stale extent mft "
                                 "reference! Corrupt filesystem. Run chkdsk.");
-               destroy_ni = TRUE;
+               destroy_ni = true;
                 m = ERR_PTR(-EIO);
                 goto unm_err_out;
         }
@@ -330,11 +331,11 @@ map_err_out:
                 ntfs_inode **tmp;
                 int new_size = (base_ni->nr_extents + 4) * sizeof(ntfs_inode *);
  
-               tmp = (ntfs_inode **)kmalloc(new_size, GFP_NOFS);
+               tmp = kmalloc(new_size, GFP_NOFS);
                 if (unlikely(!tmp)) {
                         ntfs_error(base_ni->vol->sb, "Failed to allocate "
                                         "internal buffer.");
-                       destroy_ni = TRUE;
+                       destroy_ni = true;
                         m = ERR_PTR(-ENOMEM);
                         goto unm_err_out;
                 }
@@ -347,14 +348,14 @@ map_err_out:
                 base_ni->ext.extent_ntfs_inos = tmp;
         }
         base_ni->ext.extent_ntfs_inos[base_ni->nr_extents++] = ni;
-       up(&base_ni->extent_lock);
+       mutex_unlock(&base_ni->extent_lock);
         atomic_dec(&base_ni->count);
         ntfs_debug("Done 2.");
         *ntfs_ino = ni;
         return m;
  unm_err_out:
         unmap_mft_record(ni);
-       up(&base_ni->extent_lock);
+       mutex_unlock(&base_ni->extent_lock);
         atomic_dec(&base_ni->count);
         /*
          * If the extent inode was not attached to the base inode we need to
@@ -399,12 +400,12 @@ void __mark_mft_record_dirty(ntfs_inode *ni)
         BUG_ON(NInoAttr(ni));
         mark_ntfs_record_dirty(ni->page, ni->page_ofs);
         /* Determine the base vfs inode and mark it dirty, too. */
-       down(&ni->extent_lock);
+       mutex_lock(&ni->extent_lock);
         if (likely(ni->nr_extents >= 0))
                 base_ni = ni;
         else
                 base_ni = ni->ext.base_ntfs_ino;
-       up(&ni->extent_lock);
+       mutex_unlock(&ni->extent_lock);
         __mark_inode_dirty(VFS_I(base_ni), I_DIRTY_SYNC | I_DIRTY_DATASYNC);
  }
  
@@ -650,10 +651,7 @@ err_out:
   * fs/ntfs/aops.c::mark_ntfs_record_dirty().
   *
   * On success, clean the mft record and return 0.  On error, leave the mft
- * record dirty and return -errno.  The caller should call make_bad_inode() on
- * the base inode to ensure no more access happens to this inode.  We do not do
- * it here as the caller may want to finish writing other extent mft records
- * first to minimize on-disk metadata inconsistencies.
+ * record dirty and return -errno.
   *
   * NOTE:  We always perform synchronous i/o and ignore the @sync parameter.
   * However, if the mft record has a counterpart in the mft mirror and @sync is
@@ -859,7 +857,7 @@ err_out:
   * caller is responsible for unlocking the ntfs inode and unpinning the base
   * vfs inode.
   *
- * Return TRUE if the mft record may be written out and FALSE if not.
+ * Return 'true' if the mft record may be written out and 'false' if not.
   *
   * The caller has locked the page and cleared the uptodate flag on it which
   * means that we can safely write out any dirty mft records that do not have
@@ -870,7 +868,7 @@ err_out:
   * Here is a description of the tests we perform:
   *
   * If the inode is found in icache we know the mft record must be a base mft
- * record.  If it is dirty, we do not write it and return FALSE as the vfs
+ * record.  If it is dirty, we do not write it and return 'false' as the vfs
   * inode write paths will result in the access times being updated which would
   * cause the base mft record to be redirtied and written out again.  (We know
   * the access time update will modify the base mft record because Windows
@@ -879,11 +877,11 @@ err_out:
   *
   * If the inode is in icache and not dirty, we attempt to lock the mft record
   * and if we find the lock was already taken, it is not safe to write the mft
- * record and we return FALSE.
+ * record and we return 'false'.
   *
   * If we manage to obtain the lock we have exclusive access to the mft record,
   * which also allows us safe writeout of the mft record.  We then set
- * @locked_ni to the locked ntfs inode and return TRUE.
+ * @locked_ni to the locked ntfs inode and return 'true'.
   *
   * Note we cannot just lock the mft record and sleep while waiting for the lock
   * because this would deadlock due to lock reversal (normally the mft record is
@@ -893,24 +891,24 @@ err_out:
   * If the inode is not in icache we need to perform further checks.
   *
   * If the mft record is not a FILE record or it is a base mft record, we can
- * safely write it and return TRUE.
+ * safely write it and return 'true'.
   *
   * We now know the mft record is an extent mft record.  We check if the inode
   * corresponding to its base mft record is in icache and obtain a reference to
- * it if it is.  If it is not, we can safely write it and return TRUE.
+ * it if it is.  If it is not, we can safely write it and return 'true'.
   *
   * We now have the base inode for the extent mft record.  We check if it has an
   * ntfs inode for the extent mft record attached and if not it is safe to write
- * the extent mft record and we return TRUE.
+ * the extent mft record and we return 'true'.
   *
   * The ntfs inode for the extent mft record is attached to the base inode so we
   * attempt to lock the extent mft record and if we find the lock was already
- * taken, it is not safe to write the extent mft record and we return FALSE.
+ * taken, it is not safe to write the extent mft record and we return 'false'.
   *
   * If we manage to obtain the lock we have exclusive access to the extent mft
   * record, which also allows us safe writeout of the extent mft record.  We
   * set the ntfs inode of the extent mft record clean and then set @locked_ni to
- * the now locked ntfs inode and return TRUE.
+ * the now locked ntfs inode and return 'true'.
   *
   * Note, the reason for actually writing dirty mft records here and not just
   * relying on the vfs inode dirty code paths is that we can have mft records
@@ -924,7 +922,7 @@ err_out:
   * appear if the mft record is reused for a new inode before it got written
   * out.
   */
-BOOL ntfs_may_write_mft_record(ntfs_volume *vol, const unsigned long mft_no,
+bool ntfs_may_write_mft_record(ntfs_volume *vol, const unsigned long mft_no,
                 const MFT_RECORD *m, ntfs_inode **locked_ni)
  {
         struct super_block *sb = vol->sb;
@@ -979,16 +977,16 @@ BOOL ntfs_may_write_mft_record(ntfs_volume *vol, const unsigned long mft_no,
                                         mft_no);
                         atomic_dec(&ni->count);
                         iput(vi);
-                       return FALSE;
+                       return false;
                 }
                 ntfs_debug("Inode 0x%lx is not dirty.", mft_no);
                 /* The inode is not dirty, try to take the mft record lock. */
-               if (unlikely(down_trylock(&ni->mrec_lock))) {
+               if (unlikely(!mutex_trylock(&ni->mrec_lock))) {
                         ntfs_debug("Mft record 0x%lx is already locked, do "
                                         "not write it.", mft_no);
                         atomic_dec(&ni->count);
                         iput(vi);
-                       return FALSE;
+                       return false;
                 }
                 ntfs_debug("Managed to lock mft record 0x%lx, write it.",
                                 mft_no);
@@ -997,7 +995,7 @@ BOOL ntfs_may_write_mft_record(ntfs_volume *vol, const unsigned long mft_no,
                  * return the locked ntfs inode.
                  */
                 *locked_ni = ni;
-               return TRUE;
+               return true;
         }
         ntfs_debug("Inode 0x%lx is not in icache.", mft_no);
         /* The inode is not in icache. */
@@ -1005,13 +1003,13 @@ BOOL ntfs_may_write_mft_record(ntfs_volume *vol, const unsigned long mft_no,
         if (!ntfs_is_mft_record(m->magic)) {
                 ntfs_debug("Mft record 0x%lx is not a FILE record, write it.",
                                 mft_no);
-               return TRUE;
+               return true;
         }
         /* Write the mft record if it is a base inode. */
         if (!m->base_mft_record) {
                 ntfs_debug("Mft record 0x%lx is a base record, write it.",
                                 mft_no);
-               return TRUE;
+               return true;
         }
         /*
          * This is an extent mft record.  Check if the inode corresponding to
@@ -1035,7 +1033,7 @@ BOOL ntfs_may_write_mft_record(ntfs_volume *vol, const unsigned long mft_no,
                  */
                 ntfs_debug("Base inode 0x%lx is not in icache, write the "
                                 "extent record.", na.mft_no);
-               return TRUE;
+               return true;
         }
         ntfs_debug("Base inode 0x%lx is in icache.", na.mft_no);
         /*
@@ -1043,17 +1041,17 @@ BOOL ntfs_may_write_mft_record(ntfs_volume *vol, const unsigned long mft_no,
          * corresponding to this extent mft record attached.
          */
         ni = NTFS_I(vi);
-       down(&ni->extent_lock);
+       mutex_lock(&ni->extent_lock);
         if (ni->nr_extents <= 0) {
                 /*
                  * The base inode has no attached extent inodes, write this
                  * extent mft record.
                  */
-               up(&ni->extent_lock);
+               mutex_unlock(&ni->extent_lock);
                 iput(vi);
                 ntfs_debug("Base inode 0x%lx has no attached extent inodes, "
                                 "write the extent record.", na.mft_no);
-               return TRUE;
+               return true;
         }
         /* Iterate over the attached extent inodes. */
         extent_nis = ni->ext.extent_ntfs_inos;
@@ -1072,28 +1070,28 @@ BOOL ntfs_may_write_mft_record(ntfs_volume *vol, const unsigned long mft_no,
          * extent mft record.
          */
         if (!eni) {
-               up(&ni->extent_lock);
+               mutex_unlock(&ni->extent_lock);
                 iput(vi);
                 ntfs_debug("Extent inode 0x%lx is not attached to its base "
                                 "inode 0x%lx, write the extent record.",
                                 mft_no, na.mft_no);
-               return TRUE;
+               return true;
         }
         ntfs_debug("Extent inode 0x%lx is attached to its base inode 0x%lx.",
                         mft_no, na.mft_no);
         /* Take a reference to the extent ntfs inode. */
         atomic_inc(&eni->count);
-       up(&ni->extent_lock);
+       mutex_unlock(&ni->extent_lock);
         /*
          * Found the extent inode coresponding to this extent mft record.
          * Try to take the mft record lock.
          */
-       if (unlikely(down_trylock(&eni->mrec_lock))) {
+       if (unlikely(!mutex_trylock(&eni->mrec_lock))) {
                 atomic_dec(&eni->count);
                 iput(vi);
                 ntfs_debug("Extent mft record 0x%lx is already locked, do "
                                 "not write it.", mft_no);
-               return FALSE;
+               return false;
         }
         ntfs_debug("Managed to lock extent mft record 0x%lx, write it.",
                         mft_no);
@@ -1105,7 +1103,7 @@ BOOL ntfs_may_write_mft_record(ntfs_volume *vol, const unsigned long mft_no,
          * the locked extent ntfs inode.
          */
         *locked_ni = eni;
-       return TRUE;
+       return true;
  }
  
  static const char *es = "  Leaving inconsistent metadata.  Unmount and run "
@@ -1356,7 +1354,7 @@ static int ntfs_mft_bitmap_extend_allocation_nolock(ntfs_volume *vol)
                 ntfs_unmap_page(page);
                 /* Allocate a cluster from the DATA_ZONE. */
                 rl2 = ntfs_cluster_alloc(vol, rl[1].vcn, 1, lcn, DATA_ZONE,
-                               TRUE);
+                               true);
                 if (IS_ERR(rl2)) {
                         up_write(&mftbmp_ni->runlist.lock);
                         ntfs_error(vol->sb, "Failed to allocate a cluster for "
@@ -1726,7 +1724,7 @@ static int ntfs_mft_data_extend_allocation_nolock(ntfs_volume *vol)
         ATTR_RECORD *a = NULL;
         int ret, mp_size;
         u32 old_alen = 0;
-       BOOL mp_rebuilt = FALSE;
+       bool mp_rebuilt = false;
  
         ntfs_debug("Extending mft data allocation.");
         mft_ni = NTFS_I(vol->mft_ino);
@@ -1782,7 +1780,7 @@ static int ntfs_mft_data_extend_allocation_nolock(ntfs_volume *vol)
         old_last_vcn = rl[1].vcn;
         do {
                 rl2 = ntfs_cluster_alloc(vol, old_last_vcn, nr, lcn, MFT_ZONE,
-                               TRUE);
+                               true);
                 if (likely(!IS_ERR(rl2)))
                         break;
                 if (PTR_ERR(rl2) != -ENOSPC || nr == min_nr) {
@@ -1886,7 +1884,7 @@ static int ntfs_mft_data_extend_allocation_nolock(ntfs_volume *vol)
                 ret = -EOPNOTSUPP;
                 goto undo_alloc;
         }
-       mp_rebuilt = TRUE;
+       mp_rebuilt = true;
         /* Generate the mapping pairs array directly into the attr record. */
         ret = ntfs_mapping_pairs_build(vol, (u8*)a +
                         le16_to_cpu(a->data.non_resident.mapping_pairs_offset),
@@ -2257,7 +2255,7 @@ ntfs_inode *ntfs_mft_record_alloc(ntfs_volume *vol, const int mode,
         unsigned int ofs;
         int err;
         le16 seq_no, usn;
-       BOOL record_formatted = FALSE;
+       bool record_formatted = false;
  
         if (base_ni) {
                 ntfs_debug("Entering (allocating an extent mft record for "
@@ -2456,7 +2454,7 @@ have_alloc_rec:
                 mft_ni->initialized_size = new_initialized_size;
         }
         write_unlock_irqrestore(&mft_ni->size_lock, flags);
-       record_formatted = TRUE;
+       record_formatted = true;
         /* Update the mft data attribute record to reflect the new sizes. */
         m = map_mft_record(mft_ni);
         if (IS_ERR(m)) {
@@ -2639,11 +2637,6 @@ mft_rec_already_initialized:
                         goto undo_mftbmp_alloc;
                 }
                 vi->i_ino = bit;
-               /*
-                * This is the optimal IO size (for stat), not the fs block
-                * size.
-                */
-               vi->i_blksize = PAGE_CACHE_SIZE;
                 /*
                  * This is for checking whether an inode has changed w.r.t. a
                  * file so that the file can be updated if necessary (compare
@@ -2672,7 +2665,7 @@ mft_rec_already_initialized:
                         ni->name_len = 4;
  
                         ni->itype.index.block_size = 4096;
-                       ni->itype.index.block_size_bits = generic_ffs(4096) - 1;
+                       ni->itype.index.block_size_bits = ntfs_ffs(4096) - 1;
                         ni->itype.index.collation_rule = COLLATION_FILE_NAME;
                         if (vol->cluster_size <= ni->itype.index.block_size) {
                                 ni->itype.index.vcn_size = vol->cluster_size;
@@ -2711,7 +2704,7 @@ mft_rec_already_initialized:
                  * have its page mapped and it is very easy to do.
                  */
                 atomic_inc(&ni->count);
-               down(&ni->mrec_lock);
+               mutex_lock(&ni->mrec_lock);
                 ni->page = page;
                 ni->page_ofs = ofs;
                 /*
@@ -2798,22 +2791,22 @@ int ntfs_extent_mft_record_free(ntfs_inode *ni, MFT_RECORD *m)
         BUG_ON(NInoAttr(ni));
         BUG_ON(ni->nr_extents != -1);
  
-       down(&ni->extent_lock);
+       mutex_lock(&ni->extent_lock);
         base_ni = ni->ext.base_ntfs_ino;
-       up(&ni->extent_lock);
+       mutex_unlock(&ni->extent_lock);
  
         BUG_ON(base_ni->nr_extents <= 0);
  
         ntfs_debug("Entering for extent inode 0x%lx, base inode 0x%lx.\n",
                         mft_no, base_ni->mft_no);
  
-       down(&base_ni->extent_lock);
+       mutex_lock(&base_ni->extent_lock);
  
         /* Make sure we are holding the only reference to the extent inode. */
         if (atomic_read(&ni->count) > 2) {
                 ntfs_error(vol->sb, "Tried to free busy extent inode 0x%lx, "
                                 "not freeing.", base_ni->mft_no);
-               up(&base_ni->extent_lock);
+               mutex_unlock(&base_ni->extent_lock);
                 return -EBUSY;
         }
  
@@ -2831,7 +2824,7 @@ int ntfs_extent_mft_record_free(ntfs_inode *ni, MFT_RECORD *m)
                 break;
         }
  
-       up(&base_ni->extent_lock);
+       mutex_unlock(&base_ni->extent_lock);
  
         if (unlikely(err)) {
                 ntfs_error(vol->sb, "Extent inode 0x%lx is not attached to "
@@ -2890,16 +2883,16 @@ rollback_error:
         return 0;
  rollback:
         /* Rollback what we did... */
-       down(&base_ni->extent_lock);
+       mutex_lock(&base_ni->extent_lock);
         extent_nis = base_ni->ext.extent_ntfs_inos;
         if (!(base_ni->nr_extents & 3)) {
                 int new_size = (base_ni->nr_extents + 4) * sizeof(ntfs_inode*);
  
-               extent_nis = (ntfs_inode**)kmalloc(new_size, GFP_NOFS);
+               extent_nis = kmalloc(new_size, GFP_NOFS);
                 if (unlikely(!extent_nis)) {
                         ntfs_error(vol->sb, "Failed to allocate internal "
                                         "buffer during rollback.%s", es);
-                       up(&base_ni->extent_lock);
+                       mutex_unlock(&base_ni->extent_lock);
                         NVolSetErrors(vol);
                         goto rollback_error;
                 }
@@ -2914,7 +2907,7 @@ rollback:
         m->flags |= MFT_RECORD_IN_USE;
         m->sequence_number = old_seq_no;
         extent_nis[base_ni->nr_extents++] = ni;
-       up(&base_ni->extent_lock);
+       mutex_unlock(&base_ni->extent_lock);
         mark_mft_record_dirty(ni);
         return err;
  }