[XFS] get_bulkall() could return incorrect inode state

author Vlad Apostolov <vapo@sgi.com>

Thu, 11 Oct 2007 07:44:18 +0000 (17:44 +1000)

committer Tim Shimmin <tes@chook.melbourne.sgi.com>

Tue, 16 Oct 2007 02:21:15 +0000 (12:21 +1000)
author Vlad Apostolov <vapo@sgi.com>
Thu, 11 Oct 2007 07:44:18 +0000 (17:44 +1000)
committer Tim Shimmin <tes@chook.melbourne.sgi.com>
Tue, 16 Oct 2007 02:21:15 +0000 (12:21 +1000)
diff --git a/fs/xfs/xfs_inode.c b/fs/xfs/xfs_inode.c

index 3d8ba8fec19161f75ab7dda9ec426da65d42f62c..abf509a88915e95aae00dcebec502170b1280b38 100644 (file)
--- a/fs/xfs/xfs_inode.c
+++ b/fs/xfs/xfs_inode.c
@@ -1931,9 +1931,9 @@ xfs_iunlink(
          */
         error = xfs_trans_read_buf(mp, tp, mp->m_ddev_targp, agdaddr,
                                    XFS_FSS_TO_BB(mp, 1), 0, &agibp);
-       if (error) {
+       if (error)
                 return error;
-       }
+
         /*
          * Validate the magic number of the agi block.
          */
@@ -1957,6 +1957,24 @@ xfs_iunlink(
         ASSERT(agi->agi_unlinked[bucket_index]);
         ASSERT(be32_to_cpu(agi->agi_unlinked[bucket_index]) != agino);
  
+       error = xfs_itobp(mp, tp, ip, &dip, &ibp, 0, 0);
+       if (error)
+               return error;
+
+       /*
+        * Clear the on-disk di_nlink. This is to prevent xfs_bulkstat
+        * from picking up this inode when it is reclaimed (its incore state
+        * initialized but not flushed to disk yet). The in-core di_nlink is
+        * already cleared in xfs_droplink() and a corresponding transaction
+        * logged. The hack here just synchronizes the in-core to on-disk
+        * di_nlink value in advance before the actual inode sync to disk.
+        * This is OK because the inode is already unlinked and would never
+        * change its di_nlink again for this inode generation.
+        * This is a temporary hack that would require a proper fix
+        * in the future.
+        */
+       dip->di_core.di_nlink = 0;
+
         if (be32_to_cpu(agi->agi_unlinked[bucket_index]) != NULLAGINO) {
                 /*
                  * There is already another inode in the bucket we need
@@ -1964,10 +1982,6 @@ xfs_iunlink(
                  * Here we put the head pointer into our next pointer,
                  * and then we fall through to point the head at us.
                  */
-               error = xfs_itobp(mp, tp, ip, &dip, &ibp, 0, 0);
-               if (error) {
-                       return error;
-               }
                 ASSERT(be32_to_cpu(dip->di_next_unlinked) == NULLAGINO);
                 /* both on-disk, don't endian flip twice */
                 dip->di_next_unlinked = agi->agi_unlinked[bucket_index];
diff --git a/fs/xfs/xfs_itable.c b/fs/xfs/xfs_itable.c

index efeeafe275b97fe9f897d520ec1384837329365b..1edd9afb664b062ab2346a490e4e5f21c96454d4 100644 (file)
--- a/fs/xfs/xfs_itable.c
+++ b/fs/xfs/xfs_itable.c
@@ -290,8 +290,16 @@ xfs_bulkstat_use_dinode(
                 return 1;
         dip = (xfs_dinode_t *)
                         xfs_buf_offset(bp, clustidx << mp->m_sb.sb_inodelog);
+       /*
+        * Check the buffer containing the on-disk inode for di_nlink == 0.
+        * This is to prevent xfs_bulkstat from picking up just reclaimed
+        * inodes that have their in-core state initialized but not flushed
+        * to disk yet. This is a temporary hack that would require a proper
+        * fix in the future.
+        */
         if (be16_to_cpu(dip->di_core.di_magic) != XFS_DINODE_MAGIC ||
-           !XFS_DINODE_GOOD_VERSION(dip->di_core.di_version))
+           !XFS_DINODE_GOOD_VERSION(dip->di_core.di_version) ||
+           !dip->di_core.di_nlink)
                 return 0;
         if (flags & BULKSTAT_FG_QUICK) {
                 *dipp = dip;
author	Vlad Apostolov <vapo@sgi.com>
	Thu, 11 Oct 2007 07:44:18 +0000 (17:44 +1000)
committer	Tim Shimmin <tes@chook.melbourne.sgi.com>
	Tue, 16 Oct 2007 02:21:15 +0000 (12:21 +1000)
fs/xfs/xfs_inode.c		patch | blob | history
fs/xfs/xfs_itable.c		patch | blob | history