btrfs: fix RWF_NOWAIT writes blocking on extent locks and waiting for IO

author Filipe Manana <fdmanana@suse.com>
Mon, 15 Jun 2020 17:49:39 +0000 (18:49 +0100)
committer David Sterba <dsterba@suse.com>
Tue, 16 Jun 2020 17:22:45 +0000 (19:22 +0200)
diff --git a/fs/btrfs/file.c b/fs/btrfs/file.c
index 6d5d905..2520605 100644
--- a/fs/btrfs/file.c
+++ b/fs/btrfs/file.c
@@ -1533,7 +1533,7 @@ lock_and_cleanup_extent_if_need(struct btrfs_inode *inode, struct page **pages,
  }
  
  static noinline int check_can_nocow(struct btrfs_inode *inode, loff_t pos,
-                                   size_t *write_bytes)
+                                   size_t *write_bytes, bool nowait)
  {
         struct btrfs_fs_info *fs_info = inode->root->fs_info;
         struct btrfs_root *root = inode->root;
@@ -1541,27 +1541,43 @@ static noinline int check_can_nocow(struct btrfs_inode *inode, loff_t pos,
         u64 num_bytes;
         int ret;
  
-       if (!btrfs_drew_try_write_lock(&root->snapshot_lock))
+       if (!nowait && !btrfs_drew_try_write_lock(&root->snapshot_lock))
                 return -EAGAIN;
  
         lockstart = round_down(pos, fs_info->sectorsize);
         lockend = round_up(pos + *write_bytes,
                            fs_info->sectorsize) - 1;
+       num_bytes = lockend - lockstart + 1;
  
-       btrfs_lock_and_flush_ordered_range(inode, lockstart,
-                                          lockend, NULL);
+       if (nowait) {
+               struct btrfs_ordered_extent *ordered;
+
+               if (!try_lock_extent(&inode->io_tree, lockstart, lockend))
+                       return -EAGAIN;
+
+               ordered = btrfs_lookup_ordered_range(inode, lockstart,
+                                                    num_bytes);
+               if (ordered) {
+                       btrfs_put_ordered_extent(ordered);
+                       ret = -EAGAIN;
+                       goto out_unlock;
+               }
+       } else {
+               btrfs_lock_and_flush_ordered_range(inode, lockstart,
+                                                  lockend, NULL);
+       }
  
-       num_bytes = lockend - lockstart + 1;
         ret = can_nocow_extent(&inode->vfs_inode, lockstart, &num_bytes,
                         NULL, NULL, NULL);
         if (ret <= 0) {
                 ret = 0;
-               btrfs_drew_write_unlock(&root->snapshot_lock);
+               if (!nowait)
+                       btrfs_drew_write_unlock(&root->snapshot_lock);
         } else {
                 *write_bytes = min_t(size_t, *write_bytes ,
                                      num_bytes - pos + lockstart);
         }
-
+out_unlock:
         unlock_extent(&inode->io_tree, lockstart, lockend);
  
         return ret;
@@ -1633,7 +1649,7 @@ static noinline ssize_t btrfs_buffered_write(struct kiocb *iocb,
                         if ((BTRFS_I(inode)->flags & (BTRFS_INODE_NODATACOW |
                                                       BTRFS_INODE_PREALLOC)) &&
                             check_can_nocow(BTRFS_I(inode), pos,
-                                       &write_bytes) > 0) {
+                                           &write_bytes, false) > 0) {
                                 /*
                                  * For nodata cow case, no need to reserve
                                  * data space.
@@ -1912,12 +1928,11 @@ static ssize_t btrfs_file_write_iter(struct kiocb *iocb,
                  */
                 if (!(BTRFS_I(inode)->flags & (BTRFS_INODE_NODATACOW |
                                               BTRFS_INODE_PREALLOC)) ||
-                   check_can_nocow(BTRFS_I(inode), pos, &nocow_bytes) <= 0) {
+                   check_can_nocow(BTRFS_I(inode), pos, &nocow_bytes,
+                                   true) <= 0) {
                         inode_unlock(inode);
                         return -EAGAIN;
                 }
-               /* check_can_nocow() locks the snapshot lock on success */
-               btrfs_drew_write_unlock(&root->snapshot_lock);
                 /*
                  * There are holes in the range or parts of the range that must
                  * be COWed (shared extents, RO block groups, etc), so just bail
author	Filipe Manana <fdmanana@suse.com>
	Mon, 15 Jun 2020 17:49:39 +0000 (18:49 +0100)
committer	David Sterba <dsterba@suse.com>
	Tue, 16 Jun 2020 17:22:45 +0000 (19:22 +0200)