btrfs: zoned: write out partially allocated region
author Naohiro Aota <naohiro.aota@wdc.com>
Fri, 8 Jul 2022 23:18:49 +0000 (08:18 +0900)
committer David Sterba <dsterba@suse.com>
Mon, 25 Jul 2022 15:45:42 +0000 (17:45 +0200)
cow_file_range() works in an all-or-nothing way: if it fails to allocate an
extent for a part of the given region, it gives up the entire region,
including the parts that were allocated successfully. Relying on that
behavior, run_delalloc_zoned() writes out data only when cow_file_range()
successfully allocates the whole region.

This all-or-nothing allocation and write-out becomes problematic when the
available space in all the block groups gets tight under the active zone
restriction. btrfs_reserve_extent() tries hard to utilize the space left in
the active block groups, but finally gives up and fails with
-ENOSPC. However, if we send the IOs for the successfully allocated region,
we can finish a zone and continue the rest of the allocation in a newly
allocated block group.

This patch implements partial write-out in run_delalloc_zoned(). With this
patch applied, cow_file_range() returns -EAGAIN to tell the caller to do
something to make further allocation possible, and reports the successfully
allocated region via done_offset. Furthermore, the zoned extent allocator
returns -EAGAIN to tell cow_file_range() to go back to its caller.
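
In short, the retry loop added to run_delalloc_zoned() (shown in full in the
diff below) follows roughly this pattern; this is a simplified sketch with
the locked-page redirty handling and error cleanup trimmed:

    while (start <= end) {
            ret = cow_file_range(inode, locked_page, start, end, page_started,
                                 nr_written, 0, &done_offset);
            if (ret && ret != -EAGAIN)      /* hard failure, give up */
                    return ret;
            if (ret == 0)                   /* the whole remainder was allocated */
                    done_offset = end;
            /* Write out what was allocated so a zone can be finished. */
            extent_write_locked_range(&inode->vfs_inode, start, done_offset);
            start = done_offset + 1;        /* continue with the rest */
    }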

Actually, we still need to wait for an IO to complete to continue the
allocation. The next patch implements that part.

CC: stable@vger.kernel.org # 5.16+
Fixes: afba2bc036b0 ("btrfs: zoned: implement active zone tracking")
Signed-off-by: Naohiro Aota <naohiro.aota@wdc.com>
Signed-off-by: David Sterba <dsterba@suse.com>
fs/btrfs/extent-tree.c
fs/btrfs/inode.c

index 5b604c3dc357ec313298a5c5a6371f8b7e1d4f83..ea3ec1e761e846fc4be8c6b46061e831f6ea4588 100644 (file)
@@ -3996,6 +3996,16 @@ static int can_allocate_chunk_zoned(struct btrfs_fs_info *fs_info,
        if (ffe_ctl->max_extent_size >= ffe_ctl->min_alloc_size)
                return -ENOSPC;
 
+       /*
+        * Not even min_alloc_size is left in any block group. Since we cannot
+        * activate a new block group, allocating more may not help. Let's tell
+        * the caller to try again and hope it makes progress by writing out
+        * some parts of the region. That is only possible for data block
+        * groups, where a part of the region can be written.
+        */
+       if (ffe_ctl->flags & BTRFS_BLOCK_GROUP_DATA)
+               return -EAGAIN;
+
        /*
         * We cannot activate a new block group and not enough space is left in any
         * block groups. So, allocating a new block group may not help. But,
index 22e2597ce163a154cdc42c9af954c434adefd141..a8f9728355442173a6d94969a9553082e4e43fc5 100644 (file)
@@ -117,7 +117,8 @@ static int btrfs_truncate(struct inode *inode, bool skip_writeback);
 static noinline int cow_file_range(struct btrfs_inode *inode,
                                   struct page *locked_page,
                                   u64 start, u64 end, int *page_started,
-                                  unsigned long *nr_written, int unlock);
+                                  unsigned long *nr_written, int unlock,
+                                  u64 *done_offset);
 static struct extent_map *create_io_em(struct btrfs_inode *inode, u64 start,
                                       u64 len, u64 orig_start, u64 block_start,
                                       u64 block_len, u64 orig_block_len,
@@ -921,7 +922,7 @@ static int submit_uncompressed_range(struct btrfs_inode *inode,
         * can directly submit them without interruption.
         */
        ret = cow_file_range(inode, locked_page, start, end, &page_started,
-                            &nr_written, 0);
+                            &nr_written, 0, NULL);
        /* Inline extent inserted, page gets unlocked and everything is done */
        if (page_started) {
                ret = 0;
@@ -1170,7 +1171,8 @@ static u64 get_extent_allocation_hint(struct btrfs_inode *inode, u64 start,
 static noinline int cow_file_range(struct btrfs_inode *inode,
                                   struct page *locked_page,
                                   u64 start, u64 end, int *page_started,
-                                  unsigned long *nr_written, int unlock)
+                                  unsigned long *nr_written, int unlock,
+                                  u64 *done_offset)
 {
        struct btrfs_root *root = inode->root;
        struct btrfs_fs_info *fs_info = root->fs_info;
@@ -1363,6 +1365,21 @@ out_reserve:
        btrfs_dec_block_group_reservations(fs_info, ins.objectid);
        btrfs_free_reserved_extent(fs_info, ins.objectid, ins.offset, 1);
 out_unlock:
+       /*
+        * If done_offset is non-NULL and ret == -EAGAIN, we expect the
+        * caller to write out the successfully allocated region and retry.
+        */
+       if (done_offset && ret == -EAGAIN) {
+               if (orig_start < start)
+                       *done_offset = start - 1;
+               else
+                       *done_offset = start;
+               return ret;
+       } else if (ret == -EAGAIN) {
+               /* Convert to -ENOSPC since the caller cannot retry. */
+               ret = -ENOSPC;
+       }
+
        /*
         * Now, we have three regions to clean up:
         *
@@ -1608,19 +1625,37 @@ static noinline int run_delalloc_zoned(struct btrfs_inode *inode,
                                       u64 end, int *page_started,
                                       unsigned long *nr_written)
 {
+       u64 done_offset = end;
        int ret;
+       bool locked_page_done = false;
 
-       ret = cow_file_range(inode, locked_page, start, end, page_started,
-                            nr_written, 0);
-       if (ret)
-               return ret;
+       while (start <= end) {
+               ret = cow_file_range(inode, locked_page, start, end, page_started,
+                                    nr_written, 0, &done_offset);
+               if (ret && ret != -EAGAIN)
+                       return ret;
 
-       if (*page_started)
-               return 0;
+               if (*page_started) {
+                       ASSERT(ret == 0);
+                       return 0;
+               }
+
+               if (ret == 0)
+                       done_offset = end;
+
+               if (done_offset == start)
+                       return -ENOSPC;
+
+               if (!locked_page_done) {
+                       __set_page_dirty_nobuffers(locked_page);
+                       account_page_redirty(locked_page);
+               }
+               locked_page_done = true;
+               extent_write_locked_range(&inode->vfs_inode, start, done_offset);
+
+               start = done_offset + 1;
+       }
 
-       __set_page_dirty_nobuffers(locked_page);
-       account_page_redirty(locked_page);
-       extent_write_locked_range(&inode->vfs_inode, start, end);
        *page_started = 1;
 
        return 0;
@@ -1712,7 +1747,7 @@ static int fallback_to_cow(struct btrfs_inode *inode, struct page *locked_page,
        }
 
        return cow_file_range(inode, locked_page, start, end, page_started,
-                             nr_written, 1);
+                             nr_written, 1, NULL);
 }
 
 struct can_nocow_file_extent_args {
@@ -2185,7 +2220,7 @@ int btrfs_run_delalloc_range(struct btrfs_inode *inode, struct page *locked_page
                                                 page_started, nr_written);
                else
                        ret = cow_file_range(inode, locked_page, start, end,
-                                            page_started, nr_written, 1);
+                                            page_started, nr_written, 1, NULL);
        } else {
                set_bit(BTRFS_INODE_HAS_ASYNC_EXTENT, &inode->runtime_flags);
                ret = cow_file_range_async(inode, wbc, locked_page, start, end,