jbd: Issue cache flush after checkpointing

author Jan Kara <jack@suse.cz>

Fri, 25 Nov 2011 23:35:39 +0000 (00:35 +0100)

committer Greg Kroah-Hartman <gregkh@linuxfoundation.org>

Fri, 3 Feb 2012 17:21:32 +0000 (09:21 -0800)
author Jan Kara <jack@suse.cz>
Fri, 25 Nov 2011 23:35:39 +0000 (00:35 +0100)
committer Greg Kroah-Hartman <gregkh@linuxfoundation.org>
Fri, 3 Feb 2012 17:21:32 +0000 (09:21 -0800)
diff --git a/fs/jbd/checkpoint.c b/fs/jbd/checkpoint.c

index f94fc48..5c93ffc 100644 (file)
--- a/fs/jbd/checkpoint.c
+++ b/fs/jbd/checkpoint.c
@@ -453,8 +453,6 @@ out:
   *
   * Return <0 on error, 0 on success, 1 if there was nothing to clean up.
   *
- * Called with the journal lock held.
- *
   * This is the only part of the journaling code which really needs to be
   * aware of transaction aborts.  Checkpointing involves writing to the
   * main filesystem area rather than to the journal, so it can proceed
@@ -472,13 +470,14 @@ int cleanup_journal_tail(journal_t *journal)
         if (is_journal_aborted(journal))
                 return 1;
  
-       /* OK, work out the oldest transaction remaining in the log, and
+       /*
+        * OK, work out the oldest transaction remaining in the log, and
          * the log block it starts at.
          *
          * If the log is now empty, we need to work out which is the
          * next transaction ID we will write, and where it will
-        * start. */
-
+        * start.
+        */
         spin_lock(&journal->j_state_lock);
         spin_lock(&journal->j_list_lock);
         transaction = journal->j_checkpoint_transactions;
@@ -504,7 +503,25 @@ int cleanup_journal_tail(journal_t *journal)
                 spin_unlock(&journal->j_state_lock);
                 return 1;
         }
+       spin_unlock(&journal->j_state_lock);
+
+       /*
+        * We need to make sure that any blocks that were recently written out
+        * --- perhaps by log_do_checkpoint() --- are flushed out before we
+        * drop the transactions from the journal. It's unlikely this will be
+        * necessary, especially with an appropriately sized journal, but we
+        * need this to guarantee correctness.  Fortunately
+        * cleanup_journal_tail() doesn't get called all that often.
+        */
+       if (journal->j_flags & JFS_BARRIER)
+               blkdev_issue_flush(journal->j_fs_dev, GFP_KERNEL, NULL);
  
+       spin_lock(&journal->j_state_lock);
+       if (!tid_gt(first_tid, journal->j_tail_sequence)) {
+               spin_unlock(&journal->j_state_lock);
+               /* Someone else cleaned up journal so return 0 */
+               return 0;
+       }
         /* OK, update the superblock to recover the freed space.
          * Physical blocks come first: have we wrapped beyond the end of
          * the log?  */
diff --git a/fs/jbd/recovery.c b/fs/jbd/recovery.c

index 5b43e96..008bf06 100644 (file)
--- a/fs/jbd/recovery.c
+++ b/fs/jbd/recovery.c
@@ -20,6 +20,7 @@
  #include <linux/fs.h>
  #include <linux/jbd.h>
  #include <linux/errno.h>
+#include <linux/blkdev.h>
  #endif
  
  /*
@@ -263,6 +264,9 @@ int journal_recover(journal_t *journal)
         err2 = sync_blockdev(journal->j_fs_dev);
         if (!err)
                 err = err2;
+       /* Flush disk caches to get replayed data on the permanent storage */
+       if (journal->j_flags & JFS_BARRIER)
+               blkdev_issue_flush(journal->j_fs_dev, GFP_KERNEL, NULL);
  
         return err;
  }
author	Jan Kara <jack@suse.cz>
	Fri, 25 Nov 2011 23:35:39 +0000 (00:35 +0100)
committer	Greg Kroah-Hartman <gregkh@linuxfoundation.org>
	Fri, 3 Feb 2012 17:21:32 +0000 (09:21 -0800)
fs/jbd/checkpoint.c		patch | blob | history
fs/jbd/recovery.c		patch | blob | history