www.infradead.org Git - users/dwmw2/linux.git/commitdiff
btrfs: track ordered bytes instead of just dio ordered bytes
author: Josef Bacik <josef@toxicpanda.com>
Fri, 9 Oct 2020 13:28:20 +0000 (09:28 -0400)
committer: David Sterba <dsterba@suse.com>
Mon, 8 Feb 2021 21:58:58 +0000 (22:58 +0100)
We track dio_bytes because the shrink delalloc code needs to know if we
have more DIO in flight than we have normal buffered IO.  The reason is
that we can't "flush" DIO; we have to just wait on the ordered extents
to finish.

However, this is true of all ordered extents.  If we have more ordered
space outstanding than dirty pages we should be waiting on ordered
extents.  Technically we are already OK on this front, because we always
do a FLUSH_DELALLOC_WAIT loop, but I want to use the ordered counter in
the preemptive flushing code as well, so change this to count all
ordered bytes instead of just DIO ordered bytes.

Reviewed-by: Nikolay Borisov <nborisov@suse.com>
Signed-off-by: Josef Bacik <josef@toxicpanda.com>
Signed-off-by: David Sterba <dsterba@suse.com>
fs/btrfs/ctree.h
fs/btrfs/disk-io.c
fs/btrfs/ordered-data.c
fs/btrfs/space-info.c

index ed6bb46a2572e13e9ddace1464be3024f1ca08e0..7d8660227520ec7060f0ee12bd06d25759aed298 100644 (file)
@@ -797,7 +797,7 @@ struct btrfs_fs_info {
        /* used to keep from writing metadata until there is a nice batch */
        struct percpu_counter dirty_metadata_bytes;
        struct percpu_counter delalloc_bytes;
-       struct percpu_counter dio_bytes;
+       struct percpu_counter ordered_bytes;
        s32 dirty_metadata_batch;
        s32 delalloc_batch;
 
index 5473bed6a7e894a1bc83cf874ed14f37deb0966e..e0d56b3d122338b49aafb4854b42da002912b871 100644 (file)
@@ -1469,7 +1469,7 @@ void btrfs_free_fs_info(struct btrfs_fs_info *fs_info)
 {
        percpu_counter_destroy(&fs_info->dirty_metadata_bytes);
        percpu_counter_destroy(&fs_info->delalloc_bytes);
-       percpu_counter_destroy(&fs_info->dio_bytes);
+       percpu_counter_destroy(&fs_info->ordered_bytes);
        percpu_counter_destroy(&fs_info->dev_replace.bio_counter);
        btrfs_free_csum_hash(fs_info);
        btrfs_free_stripe_hash_table(fs_info);
@@ -2802,7 +2802,7 @@ static int init_mount_fs_info(struct btrfs_fs_info *fs_info, struct super_block
        sb->s_blocksize = BTRFS_BDEV_BLOCKSIZE;
        sb->s_blocksize_bits = blksize_bits(BTRFS_BDEV_BLOCKSIZE);
 
-       ret = percpu_counter_init(&fs_info->dio_bytes, 0, GFP_KERNEL);
+       ret = percpu_counter_init(&fs_info->ordered_bytes, 0, GFP_KERNEL);
        if (ret)
                return ret;
 
@@ -4163,9 +4163,9 @@ void __cold close_ctree(struct btrfs_fs_info *fs_info)
                       percpu_counter_sum(&fs_info->delalloc_bytes));
        }
 
-       if (percpu_counter_sum(&fs_info->dio_bytes))
+       if (percpu_counter_sum(&fs_info->ordered_bytes))
                btrfs_info(fs_info, "at unmount dio bytes count %lld",
-                          percpu_counter_sum(&fs_info->dio_bytes));
+                          percpu_counter_sum(&fs_info->ordered_bytes));
 
        btrfs_sysfs_remove_mounted(fs_info);
        btrfs_sysfs_remove_fsid(fs_info->fs_devices);
index b4e6500548a2ef84d39eac4d78f803397b7d6a44..e8dee1578d4a1f5eb2a7bf0382004300580fa11e 100644 (file)
@@ -206,11 +206,11 @@ static int __btrfs_add_ordered_extent(struct btrfs_inode *inode, u64 file_offset
               type == BTRFS_ORDERED_COMPRESSED);
        set_bit(type, &entry->flags);
 
-       if (dio) {
-               percpu_counter_add_batch(&fs_info->dio_bytes, num_bytes,
-                                        fs_info->delalloc_batch);
+       percpu_counter_add_batch(&fs_info->ordered_bytes, num_bytes,
+                                fs_info->delalloc_batch);
+
+       if (dio)
                set_bit(BTRFS_ORDERED_DIRECT, &entry->flags);
-       }
 
        /* one ref for the tree */
        refcount_set(&entry->refs, 1);
@@ -503,9 +503,8 @@ void btrfs_remove_ordered_extent(struct btrfs_inode *btrfs_inode,
                btrfs_delalloc_release_metadata(btrfs_inode, entry->num_bytes,
                                                false);
 
-       if (test_bit(BTRFS_ORDERED_DIRECT, &entry->flags))
-               percpu_counter_add_batch(&fs_info->dio_bytes, -entry->num_bytes,
-                                        fs_info->delalloc_batch);
+       percpu_counter_add_batch(&fs_info->ordered_bytes, -entry->num_bytes,
+                                fs_info->delalloc_batch);
 
        tree = &btrfs_inode->ordered_tree;
        spin_lock_irq(&tree->lock);
index d879e3fea0b66e38b4d6d32646b664a992856d1b..711beacd75d60f43544ee001e0e85d7062a52aa8 100644 (file)
@@ -489,7 +489,7 @@ static void shrink_delalloc(struct btrfs_fs_info *fs_info,
 {
        struct btrfs_trans_handle *trans;
        u64 delalloc_bytes;
-       u64 dio_bytes;
+       u64 ordered_bytes;
        u64 items;
        long time_left;
        int loops;
@@ -513,25 +513,20 @@ static void shrink_delalloc(struct btrfs_fs_info *fs_info,
 
        delalloc_bytes = percpu_counter_sum_positive(
                                                &fs_info->delalloc_bytes);
-       dio_bytes = percpu_counter_sum_positive(&fs_info->dio_bytes);
-       if (delalloc_bytes == 0 && dio_bytes == 0) {
-               if (trans)
-                       return;
-               if (wait_ordered)
-                       btrfs_wait_ordered_roots(fs_info, items, 0, (u64)-1);
+       ordered_bytes = percpu_counter_sum_positive(&fs_info->ordered_bytes);
+       if (delalloc_bytes == 0 && ordered_bytes == 0)
                return;
-       }
 
        /*
         * If we are doing more ordered than delalloc we need to just wait on
         * ordered extents, otherwise we'll waste time trying to flush delalloc
         * that likely won't give us the space back we need.
         */
-       if (dio_bytes > delalloc_bytes)
+       if (ordered_bytes > delalloc_bytes)
                wait_ordered = true;
 
        loops = 0;
-       while ((delalloc_bytes || dio_bytes) && loops < 3) {
+       while ((delalloc_bytes || ordered_bytes) && loops < 3) {
                u64 temp = min(delalloc_bytes, to_reclaim) >> PAGE_SHIFT;
                long nr_pages = min_t(u64, temp, LONG_MAX);
 
@@ -556,7 +551,8 @@ static void shrink_delalloc(struct btrfs_fs_info *fs_info,
 
                delalloc_bytes = percpu_counter_sum_positive(
                                                &fs_info->delalloc_bytes);
-               dio_bytes = percpu_counter_sum_positive(&fs_info->dio_bytes);
+               ordered_bytes = percpu_counter_sum_positive(
+                                               &fs_info->ordered_bytes);
        }
 }