btrfs: Remove fs_info from btrfs_alloc_logged_file_extent

[sfrench/cifs-2.6.git] / fs / btrfs / tree-log.c
diff --git a/fs/btrfs/tree-log.c b/fs/btrfs/tree-log.c

index 8f23a94dab770c00933f39a4ed1fb845edac22dd..b3b1d424f2d8be3328c5a50afc464fc33777a20d 100644 (file)
--- a/fs/btrfs/tree-log.c
+++ b/fs/btrfs/tree-log.c
@@ -222,11 +222,8 @@ int btrfs_pin_log_trans(struct btrfs_root *root)
  void btrfs_end_log_trans(struct btrfs_root *root)
  {
         if (atomic_dec_and_test(&root->log_writers)) {
-               /*
-                * Implicit memory barrier after atomic_dec_and_test
-                */
-               if (waitqueue_active(&root->log_writer_wait))
-                       wake_up(&root->log_writer_wait);
+               /* atomic_dec_and_test implies a barrier */
+               cond_wake_up_nomb(&root->log_writer_wait);
         }
  }
  
@@ -718,7 +715,6 @@ static noinline int replay_one_extent(struct btrfs_trans_handle *trans,
                                  * allocation tree
                                  */
                                 ret = btrfs_alloc_logged_file_extent(trans,
-                                               fs_info,
                                                 root->root_key.objectid,
                                                 key->objectid, offset, &ins);
                                 if (ret)
@@ -2936,7 +2932,6 @@ int btrfs_sync_log(struct btrfs_trans_handle *trans,
         /* bail out if we need to do a full commit */
         if (btrfs_need_log_full_commit(fs_info, trans)) {
                 ret = -EAGAIN;
-               btrfs_free_logged_extents(log, log_transid);
                 mutex_unlock(&root->log_mutex);
                 goto out;
         }
@@ -2954,7 +2949,6 @@ int btrfs_sync_log(struct btrfs_trans_handle *trans,
         if (ret) {
                 blk_finish_plug(&plug);
                 btrfs_abort_transaction(trans, ret);
-               btrfs_free_logged_extents(log, log_transid);
                 btrfs_set_log_full_commit(fs_info, trans);
                 mutex_unlock(&root->log_mutex);
                 goto out;
@@ -2988,11 +2982,8 @@ int btrfs_sync_log(struct btrfs_trans_handle *trans,
  
         mutex_lock(&log_root_tree->log_mutex);
         if (atomic_dec_and_test(&log_root_tree->log_writers)) {
-               /*
-                * Implicit memory barrier after atomic_dec_and_test
-                */
-               if (waitqueue_active(&log_root_tree->log_writer_wait))
-                       wake_up(&log_root_tree->log_writer_wait);
+               /* atomic_dec_and_test implies a barrier */
+               cond_wake_up_nomb(&log_root_tree->log_writer_wait);
         }
  
         if (ret) {
@@ -3008,7 +2999,6 @@ int btrfs_sync_log(struct btrfs_trans_handle *trans,
                         goto out;
                 }
                 btrfs_wait_tree_log_extents(log, mark);
-               btrfs_free_logged_extents(log, log_transid);
                 mutex_unlock(&log_root_tree->log_mutex);
                 ret = -EAGAIN;
                 goto out;
@@ -3026,7 +3016,6 @@ int btrfs_sync_log(struct btrfs_trans_handle *trans,
         if (atomic_read(&log_root_tree->log_commit[index2])) {
                 blk_finish_plug(&plug);
                 ret = btrfs_wait_tree_log_extents(log, mark);
-               btrfs_wait_logged_extents(trans, log, log_transid);
                 wait_log_commit(log_root_tree,
                                 root_log_ctx.log_transid);
                 mutex_unlock(&log_root_tree->log_mutex);
@@ -3051,7 +3040,6 @@ int btrfs_sync_log(struct btrfs_trans_handle *trans,
         if (btrfs_need_log_full_commit(fs_info, trans)) {
                 blk_finish_plug(&plug);
                 btrfs_wait_tree_log_extents(log, mark);
-               btrfs_free_logged_extents(log, log_transid);
                 mutex_unlock(&log_root_tree->log_mutex);
                 ret = -EAGAIN;
                 goto out_wake_log_root;
@@ -3064,7 +3052,6 @@ int btrfs_sync_log(struct btrfs_trans_handle *trans,
         if (ret) {
                 btrfs_set_log_full_commit(fs_info, trans);
                 btrfs_abort_transaction(trans, ret);
-               btrfs_free_logged_extents(log, log_transid);
                 mutex_unlock(&log_root_tree->log_mutex);
                 goto out_wake_log_root;
         }
@@ -3074,11 +3061,9 @@ int btrfs_sync_log(struct btrfs_trans_handle *trans,
                                                   EXTENT_NEW | EXTENT_DIRTY);
         if (ret) {
                 btrfs_set_log_full_commit(fs_info, trans);
-               btrfs_free_logged_extents(log, log_transid);
                 mutex_unlock(&log_root_tree->log_mutex);
                 goto out_wake_log_root;
         }
-       btrfs_wait_logged_extents(trans, log, log_transid);
  
         btrfs_set_super_log_root(fs_info->super_for_commit,
                                  log_root_tree->node->start);
@@ -3116,10 +3101,11 @@ out_wake_log_root:
         mutex_unlock(&log_root_tree->log_mutex);
  
         /*
-        * The barrier before waitqueue_active is implied by mutex_unlock
+        * The barrier before waitqueue_active (in cond_wake_up) is needed so
+        * all the updates above are seen by the woken threads. It might not be
+        * necessary, but proving that seems to be hard.
          */
-       if (waitqueue_active(&log_root_tree->log_commit_wait[index2]))
-               wake_up(&log_root_tree->log_commit_wait[index2]);
+       cond_wake_up(&log_root_tree->log_commit_wait[index2]);
  out:
         mutex_lock(&root->log_mutex);
         btrfs_remove_all_log_ctxs(root, index1, ret);
@@ -3128,10 +3114,11 @@ out:
         mutex_unlock(&root->log_mutex);
  
         /*
-        * The barrier before waitqueue_active is implied by mutex_unlock
+        * The barrier before waitqueue_active (in cond_wake_up) is needed so
+        * all the updates above are seen by the woken threads. It might not be
+        * necessary, but proving that seems to be hard.
          */
-       if (waitqueue_active(&root->log_commit_wait[index1]))
-               wake_up(&root->log_commit_wait[index1]);
+       cond_wake_up(&root->log_commit_wait[index1]);
         return ret;
  }
  
@@ -3163,14 +3150,6 @@ static void free_log_tree(struct btrfs_trans_handle *trans,
                                   EXTENT_DIRTY | EXTENT_NEW | EXTENT_NEED_WAIT);
         }
  
-       /*
-        * We may have short-circuited the log tree with the full commit logic
-        * and left ordered extents on our list, so clear these out to keep us
-        * from leaking inodes and memory.
-        */
-       btrfs_free_logged_extents(log, 0);
-       btrfs_free_logged_extents(log, 1);
-
         free_extent_buffer(log->node);
         kfree(log);
  }
@@ -4082,131 +4061,32 @@ static int extent_cmp(void *priv, struct list_head *a, struct list_head *b)
         return 0;
  }
  
-static int wait_ordered_extents(struct btrfs_trans_handle *trans,
-                               struct inode *inode,
-                               struct btrfs_root *root,
-                               const struct extent_map *em,
-                               const struct list_head *logged_list,
-                               bool *ordered_io_error)
+static int log_extent_csums(struct btrfs_trans_handle *trans,
+                           struct btrfs_inode *inode,
+                           struct btrfs_root *log_root,
+                           const struct extent_map *em)
  {
-       struct btrfs_fs_info *fs_info = root->fs_info;
-       struct btrfs_ordered_extent *ordered;
-       struct btrfs_root *log = root->log_root;
-       u64 mod_start = em->mod_start;
-       u64 mod_len = em->mod_len;
-       const bool skip_csum = BTRFS_I(inode)->flags & BTRFS_INODE_NODATASUM;
         u64 csum_offset;
         u64 csum_len;
         LIST_HEAD(ordered_sums);
         int ret = 0;
  
-       *ordered_io_error = false;
-
-       if (test_bit(EXTENT_FLAG_PREALLOC, &em->flags) ||
+       if (inode->flags & BTRFS_INODE_NODATASUM ||
+           test_bit(EXTENT_FLAG_PREALLOC, &em->flags) ||
             em->block_start == EXTENT_MAP_HOLE)
                 return 0;
  
-       /*
-        * Wait far any ordered extent that covers our extent map. If it
-        * finishes without an error, first check and see if our csums are on
-        * our outstanding ordered extents.
-        */
-       list_for_each_entry(ordered, logged_list, log_list) {
-               struct btrfs_ordered_sum *sum;
-
-               if (!mod_len)
-                       break;
-
-               if (ordered->file_offset + ordered->len <= mod_start ||
-                   mod_start + mod_len <= ordered->file_offset)
-                       continue;
-
-               if (!test_bit(BTRFS_ORDERED_IO_DONE, &ordered->flags) &&
-                   !test_bit(BTRFS_ORDERED_IOERR, &ordered->flags) &&
-                   !test_bit(BTRFS_ORDERED_DIRECT, &ordered->flags)) {
-                       const u64 start = ordered->file_offset;
-                       const u64 end = ordered->file_offset + ordered->len - 1;
-
-                       WARN_ON(ordered->inode != inode);
-                       filemap_fdatawrite_range(inode->i_mapping, start, end);
-               }
-
-               wait_event(ordered->wait,
-                          (test_bit(BTRFS_ORDERED_IO_DONE, &ordered->flags) ||
-                           test_bit(BTRFS_ORDERED_IOERR, &ordered->flags)));
-
-               if (test_bit(BTRFS_ORDERED_IOERR, &ordered->flags)) {
-                       /*
-                        * Clear the AS_EIO/AS_ENOSPC flags from the inode's
-                        * i_mapping flags, so that the next fsync won't get
-                        * an outdated io error too.
-                        */
-                       filemap_check_errors(inode->i_mapping);
-                       *ordered_io_error = true;
-                       break;
-               }
-               /*
-                * We are going to copy all the csums on this ordered extent, so
-                * go ahead and adjust mod_start and mod_len in case this
-                * ordered extent has already been logged.
-                */
-               if (ordered->file_offset > mod_start) {
-                       if (ordered->file_offset + ordered->len >=
-                           mod_start + mod_len)
-                               mod_len = ordered->file_offset - mod_start;
-                       /*
-                        * If we have this case
-                        *
-                        * |--------- logged extent ---------|
-                        *       |----- ordered extent ----|
-                        *
-                        * Just don't mess with mod_start and mod_len, we'll
-                        * just end up logging more csums than we need and it
-                        * will be ok.
-                        */
-               } else {
-                       if (ordered->file_offset + ordered->len <
-                           mod_start + mod_len) {
-                               mod_len = (mod_start + mod_len) -
-                                       (ordered->file_offset + ordered->len);
-                               mod_start = ordered->file_offset +
-                                       ordered->len;
-                       } else {
-                               mod_len = 0;
-                       }
-               }
-
-               if (skip_csum)
-                       continue;
-
-               /*
-                * To keep us from looping for the above case of an ordered
-                * extent that falls inside of the logged extent.
-                */
-               if (test_and_set_bit(BTRFS_ORDERED_LOGGED_CSUM,
-                                    &ordered->flags))
-                       continue;
-
-               list_for_each_entry(sum, &ordered->list, list) {
-                       ret = btrfs_csum_file_blocks(trans, log, sum);
-                       if (ret)
-                               break;
-               }
-       }
-
-       if (*ordered_io_error || !mod_len || ret || skip_csum)
-               return ret;
-
+       /* If we're compressed we have to save the entire range of csums. */
         if (em->compress_type) {
                 csum_offset = 0;
                 csum_len = max(em->block_len, em->orig_block_len);
         } else {
-               csum_offset = mod_start - em->start;
-               csum_len = mod_len;
+               csum_offset = em->mod_start - em->start;
+               csum_len = em->mod_len;
         }
  
         /* block start is already adjusted for the file extent offset. */
-       ret = btrfs_lookup_csums_range(fs_info->csum_root,
+       ret = btrfs_lookup_csums_range(trans->fs_info->csum_root,
                                        em->block_start + csum_offset,
                                        em->block_start + csum_offset +
                                        csum_len - 1, &ordered_sums, 0);
@@ -4218,7 +4098,7 @@ static int wait_ordered_extents(struct btrfs_trans_handle *trans,
                                                    struct btrfs_ordered_sum,
                                                    list);
                 if (!ret)
-                       ret = btrfs_csum_file_blocks(trans, log, sums);
+                       ret = btrfs_csum_file_blocks(trans, log_root, sums);
                 list_del(&sums->list);
                 kfree(sums);
         }
@@ -4230,7 +4110,6 @@ static int log_one_extent(struct btrfs_trans_handle *trans,
                           struct btrfs_inode *inode, struct btrfs_root *root,
                           const struct extent_map *em,
                           struct btrfs_path *path,
-                         const struct list_head *logged_list,
                           struct btrfs_log_ctx *ctx)
  {
         struct btrfs_root *log = root->log_root;
@@ -4242,18 +4121,11 @@ static int log_one_extent(struct btrfs_trans_handle *trans,
         u64 block_len;
         int ret;
         int extent_inserted = 0;
-       bool ordered_io_err = false;
  
-       ret = wait_ordered_extents(trans, &inode->vfs_inode, root, em,
-                       logged_list, &ordered_io_err);
+       ret = log_extent_csums(trans, inode, log, em);
         if (ret)
                 return ret;
  
-       if (ordered_io_err) {
-               ctx->io_err = -EIO;
-               return ctx->io_err;
-       }
-
         btrfs_init_map_token(&token);
  
         ret = __btrfs_drop_extents(trans, log, &inode->vfs_inode, path, em->start,
@@ -4428,7 +4300,6 @@ static int btrfs_log_changed_extents(struct btrfs_trans_handle *trans,
                                      struct btrfs_root *root,
                                      struct btrfs_inode *inode,
                                      struct btrfs_path *path,
-                                    struct list_head *logged_list,
                                      struct btrfs_log_ctx *ctx,
                                      const u64 start,
                                      const u64 end)
@@ -4484,20 +4355,6 @@ static int btrfs_log_changed_extents(struct btrfs_trans_handle *trans,
         }
  
         list_sort(NULL, &extents, extent_cmp);
-       btrfs_get_logged_extents(inode, logged_list, logged_start, logged_end);
-       /*
-        * Some ordered extents started by fsync might have completed
-        * before we could collect them into the list logged_list, which
-        * means they're gone, not in our logged_list nor in the inode's
-        * ordered tree. We want the application/user space to know an
-        * error happened while attempting to persist file data so that
-        * it can take proper action. If such error happened, we leave
-        * without writing to the log tree and the fsync must report the
-        * file data write error and not commit the current transaction.
-        */
-       ret = filemap_check_errors(inode->vfs_inode.i_mapping);
-       if (ret)
-               ctx->io_err = ret;
  process:
         while (!list_empty(&extents)) {
                 em = list_entry(extents.next, struct extent_map, list);
@@ -4516,8 +4373,7 @@ process:
  
                 write_unlock(&tree->lock);
  
-               ret = log_one_extent(trans, inode, root, em, path, logged_list,
-                                    ctx);
+               ret = log_one_extent(trans, inode, root, em, path, ctx);
                 write_lock(&tree->lock);
                 clear_em_logging(tree, em);
                 free_extent_map(em);
@@ -4902,7 +4758,6 @@ static int btrfs_log_inode(struct btrfs_trans_handle *trans,
         struct btrfs_key min_key;
         struct btrfs_key max_key;
         struct btrfs_root *log = root->log_root;
-       LIST_HEAD(logged_list);
         u64 last_extent = 0;
         int err = 0;
         int ret;
@@ -5239,7 +5094,7 @@ log_extents:
         }
         if (fast_search) {
                 ret = btrfs_log_changed_extents(trans, root, inode, dst_path,
-                                               &logged_list, ctx, start, end);
+                                               ctx, start, end);
                 if (ret) {
                         err = ret;
                         goto out_unlock;
@@ -5290,10 +5145,6 @@ log_extents:
         inode->last_log_commit = inode->last_sub_trans;
         spin_unlock(&inode->lock);
  out_unlock:
-       if (unlikely(err))
-               btrfs_put_logged_extents(&logged_list);
-       else
-               btrfs_submit_logged_extents(&logged_list, log);
         mutex_unlock(&inode->log_mutex);
  
         btrfs_free_path(path);