]> www.infradead.org Git - users/hch/misc.git/commitdiff
block: pre-calculate max_zone_append_sectors
authorChristoph Hellwig <hch@lst.de>
Mon, 4 Nov 2024 07:39:32 +0000 (08:39 +0100)
committerJens Axboe <axboe@kernel.dk>
Mon, 4 Nov 2024 17:34:07 +0000 (10:34 -0700)
max_zone_append_sectors differs from all other queue limits in that the
final value used is not stored in the queue_limits but needs to be
obtained using queue_limits_max_zone_append_sectors helper.  This not
only adds (tiny) extra overhead to the I/O path, but also can be easily
forgotten in file system code.

Add a new max_hw_zone_append_sectors value to queue_limits which is
set by the driver, and calculate max_zone_append_sectors from that and
the other inputs in blk_validate_zoned_limits, similar to how
max_sectors is calculated to fix this.

Signed-off-by: Christoph Hellwig <hch@lst.de>
Link: https://lore.kernel.org/r/20241104073955.112324-3-hch@lst.de
Signed-off-by: Jens Axboe <axboe@kernel.dk>
12 files changed:
block/blk-core.c
block/blk-merge.c
block/blk-settings.c
block/blk-sysfs.c
drivers/block/null_blk/zoned.c
drivers/block/ublk_drv.c
drivers/block/virtio_blk.c
drivers/md/dm-zone.c
drivers/nvme/host/multipath.c
drivers/nvme/host/zns.c
drivers/scsi/sd_zbc.c
include/linux/blkdev.h

index 09d10bb95fda0526588c42b4421b54a5ceac1369..5df4607321ca4d4e33d8cf238a9ce9a8b90226ff 100644 (file)
@@ -607,7 +607,7 @@ static inline blk_status_t blk_check_zone_append(struct request_queue *q,
                return BLK_STS_IOERR;
 
        /* Make sure the BIO is small enough and will not get split */
-       if (nr_sectors > queue_max_zone_append_sectors(q))
+       if (nr_sectors > q->limits.max_zone_append_sectors)
                return BLK_STS_IOERR;
 
        bio->bi_opf |= REQ_NOMERGE;
index d813d799cee72caa0755fec696f10b252efe91ac..7c1375a080ad1df207e7f0e88cb25fd2e95b1ee3 100644 (file)
@@ -388,11 +388,10 @@ struct bio *bio_split_rw(struct bio *bio, const struct queue_limits *lim,
 struct bio *bio_split_zone_append(struct bio *bio,
                const struct queue_limits *lim, unsigned *nr_segs)
 {
-       unsigned int max_sectors = queue_limits_max_zone_append_sectors(lim);
        int split_sectors;
 
        split_sectors = bio_split_rw_at(bio, lim, nr_segs,
-                       max_sectors << SECTOR_SHIFT);
+                       lim->max_zone_append_sectors << SECTOR_SHIFT);
        if (WARN_ON_ONCE(split_sectors > 0))
                split_sectors = -EINVAL;
        return bio_submit_split(bio, split_sectors);
index 5ee3d6d1448dfbdd8a78bdca607cb63c7c96743e..5cb69d85af0e5d05a7ef5b821f02bbe73aab9402 100644 (file)
@@ -91,17 +91,16 @@ static int blk_validate_zoned_limits(struct queue_limits *lim)
        if (lim->zone_write_granularity < lim->logical_block_size)
                lim->zone_write_granularity = lim->logical_block_size;
 
-       if (lim->max_zone_append_sectors) {
-               /*
-                * The Zone Append size is limited by the maximum I/O size
-                * and the zone size given that it can't span zones.
-                */
-               lim->max_zone_append_sectors =
-                       min3(lim->max_hw_sectors,
-                            lim->max_zone_append_sectors,
-                            lim->chunk_sectors);
-       }
-
+       /*
+        * The Zone Append size is limited by the maximum I/O size and the zone
+        * size given that it can't span zones.
+        *
+        * If no max_hw_zone_append_sectors limit is provided, the block layer
+        * will emulated it, else we're also bound by the hardware limit.
+        */
+       lim->max_zone_append_sectors =
+               min_not_zero(lim->max_hw_zone_append_sectors,
+                       min(lim->chunk_sectors, lim->max_hw_sectors));
        return 0;
 }
 
@@ -527,8 +526,8 @@ int blk_stack_limits(struct queue_limits *t, struct queue_limits *b,
        t->max_dev_sectors = min_not_zero(t->max_dev_sectors, b->max_dev_sectors);
        t->max_write_zeroes_sectors = min(t->max_write_zeroes_sectors,
                                        b->max_write_zeroes_sectors);
-       t->max_zone_append_sectors = min(queue_limits_max_zone_append_sectors(t),
-                                        queue_limits_max_zone_append_sectors(b));
+       t->max_hw_zone_append_sectors = min(t->max_hw_zone_append_sectors,
+                                       b->max_hw_zone_append_sectors);
 
        t->seg_boundary_mask = min_not_zero(t->seg_boundary_mask,
                                            b->seg_boundary_mask);
index 741b95dfdbf6f9d1ce54a146907d2220af08b908..d9f22122ae2ff5b15d993da7ebd2f0df78ffcab5 100644 (file)
@@ -131,6 +131,7 @@ QUEUE_SYSFS_LIMIT_SHOW_SECTORS_TO_BYTES(max_hw_discard_sectors)
 QUEUE_SYSFS_LIMIT_SHOW_SECTORS_TO_BYTES(max_write_zeroes_sectors)
 QUEUE_SYSFS_LIMIT_SHOW_SECTORS_TO_BYTES(atomic_write_max_sectors)
 QUEUE_SYSFS_LIMIT_SHOW_SECTORS_TO_BYTES(atomic_write_boundary_sectors)
+QUEUE_SYSFS_LIMIT_SHOW_SECTORS_TO_BYTES(max_zone_append_sectors)
 
 #define QUEUE_SYSFS_LIMIT_SHOW_SECTORS_TO_KB(_field)                   \
 static ssize_t queue_##_field##_show(struct gendisk *disk, char *page) \
@@ -178,18 +179,6 @@ static ssize_t queue_max_discard_sectors_store(struct gendisk *disk,
        return ret;
 }
 
-/*
- * For zone append queue_max_zone_append_sectors does not just return the
- * underlying queue limits, but actually contains a calculation.  Because of
- * that we can't simply use QUEUE_SYSFS_LIMIT_SHOW_SECTORS_TO_BYTES here.
- */
-static ssize_t queue_zone_append_max_show(struct gendisk *disk, char *page)
-{
-       return sprintf(page, "%llu\n",
-               (u64)queue_max_zone_append_sectors(disk->queue) <<
-                       SECTOR_SHIFT);
-}
-
 static ssize_t
 queue_max_sectors_store(struct gendisk *disk, const char *page, size_t count)
 {
@@ -479,7 +468,7 @@ QUEUE_RO_ENTRY(queue_atomic_write_unit_min, "atomic_write_unit_min_bytes");
 
 QUEUE_RO_ENTRY(queue_write_same_max, "write_same_max_bytes");
 QUEUE_RO_ENTRY(queue_max_write_zeroes_sectors, "write_zeroes_max_bytes");
-QUEUE_RO_ENTRY(queue_zone_append_max, "zone_append_max_bytes");
+QUEUE_RO_ENTRY(queue_max_zone_append_sectors, "zone_append_max_bytes");
 QUEUE_RO_ENTRY(queue_zone_write_granularity, "zone_write_granularity");
 
 QUEUE_RO_ENTRY(queue_zoned, "zoned");
@@ -607,7 +596,7 @@ static struct attribute *queue_attrs[] = {
        &queue_atomic_write_unit_max_entry.attr,
        &queue_write_same_max_entry.attr,
        &queue_max_write_zeroes_sectors_entry.attr,
-       &queue_zone_append_max_entry.attr,
+       &queue_max_zone_append_sectors_entry.attr,
        &queue_zone_write_granularity_entry.attr,
        &queue_rotational_entry.attr,
        &queue_zoned_entry.attr,
index 9bc768b2ca56b7bad7c4dc1393ad09ebaba3b65a..0d5f9bf952292ec90bfa5bd89f267cab38431355 100644 (file)
@@ -166,7 +166,7 @@ int null_init_zoned_dev(struct nullb_device *dev,
 
        lim->features |= BLK_FEAT_ZONED;
        lim->chunk_sectors = dev->zone_size_sects;
-       lim->max_zone_append_sectors = dev->zone_append_max_sectors;
+       lim->max_hw_zone_append_sectors = dev->zone_append_max_sectors;
        lim->max_open_zones = dev->zone_max_open;
        lim->max_active_zones = dev->zone_max_active;
        return 0;
index 59951e7c25939f471a777956916fa768d8c46e18..8d938b2b41eec3d24ffa79158f2141c15944d651 100644 (file)
@@ -2270,7 +2270,7 @@ static int ublk_ctrl_start_dev(struct ublk_device *ub, struct io_uring_cmd *cmd)
                lim.features |= BLK_FEAT_ZONED;
                lim.max_active_zones = p->max_active_zones;
                lim.max_open_zones =  p->max_open_zones;
-               lim.max_zone_append_sectors = p->max_zone_append_sectors;
+               lim.max_hw_zone_append_sectors = p->max_zone_append_sectors;
        }
 
        if (ub->params.basic.attrs & UBLK_ATTR_VOLATILE_CACHE) {
index 194417abc1053c0c73a8efdfe45b13c24534eec0..0e99a4714928478c1ba81777b8e98448eb5b992a 100644 (file)
@@ -784,7 +784,7 @@ static int virtblk_read_zoned_limits(struct virtio_blk *vblk,
                        wg, v);
                return -ENODEV;
        }
-       lim->max_zone_append_sectors = v;
+       lim->max_hw_zone_append_sectors = v;
        dev_dbg(&vdev->dev, "max append sectors = %u\n", v);
 
        return 0;
index c0d41c36e06ebf8a0a32968185227ac073c80ad4..20edd3fabbabfe622783030b6106de2a9b890fcf 100644 (file)
@@ -344,7 +344,7 @@ int dm_set_zones_restrictions(struct dm_table *t, struct request_queue *q,
                clear_bit(DMF_EMULATE_ZONE_APPEND, &md->flags);
        } else {
                set_bit(DMF_EMULATE_ZONE_APPEND, &md->flags);
-               lim->max_zone_append_sectors = 0;
+               lim->max_hw_zone_append_sectors = 0;
        }
 
        /*
@@ -379,7 +379,7 @@ int dm_set_zones_restrictions(struct dm_table *t, struct request_queue *q,
        if (!zlim.mapped_nr_seq_zones) {
                lim->max_open_zones = 0;
                lim->max_active_zones = 0;
-               lim->max_zone_append_sectors = 0;
+               lim->max_hw_zone_append_sectors = 0;
                lim->zone_write_granularity = 0;
                lim->chunk_sectors = 0;
                lim->features &= ~BLK_FEAT_ZONED;
index 6a15873055b9513f827709ad780bc7e18f75e439..c26cb7d3a2e55bfe08f4da317298411e2033ca68 100644 (file)
@@ -636,7 +636,7 @@ int nvme_mpath_alloc_disk(struct nvme_ctrl *ctrl, struct nvme_ns_head *head)
        if (head->ids.csi == NVME_CSI_ZNS)
                lim.features |= BLK_FEAT_ZONED;
        else
-               lim.max_zone_append_sectors = 0;
+               lim.max_hw_zone_append_sectors = 0;
 
        head->disk = blk_alloc_disk(&lim, ctrl->numa_node);
        if (IS_ERR(head->disk))
index 9a06f9d98cd68c5691716760f63ada3fbf3d4275..382949e18c6ae7635b511258b04a7740ea4909c8 100644 (file)
@@ -111,7 +111,7 @@ void nvme_update_zone_info(struct nvme_ns *ns, struct queue_limits *lim,
        lim->features |= BLK_FEAT_ZONED;
        lim->max_open_zones = zi->max_open_zones;
        lim->max_active_zones = zi->max_active_zones;
-       lim->max_zone_append_sectors = ns->ctrl->max_zone_append;
+       lim->max_hw_zone_append_sectors = ns->ctrl->max_zone_append;
        lim->chunk_sectors = ns->head->zsze =
                nvme_lba_to_sect(ns->head, zi->zone_size);
 }
index ee2b742387581bc13ecbe4ef8a826d53b031a8d8..de5c54c057ecd7540fd2b825457cd0037a468e2a 100644 (file)
@@ -634,8 +634,6 @@ int sd_zbc_read_zones(struct scsi_disk *sdkp, struct queue_limits *lim,
                lim->max_open_zones = sdkp->zones_max_open;
        lim->max_active_zones = 0;
        lim->chunk_sectors = logical_to_sectors(sdkp->device, zone_blocks);
-       /* Enable block layer zone append emulation */
-       lim->max_zone_append_sectors = 0;
 
        return 0;
 
index 7bfc877e159e1e81ec0d0747eaaa06d3d856cdb7..6d1413bd69a5bfa2939f687af71ffceb05a83b34 100644 (file)
@@ -375,6 +375,7 @@ struct queue_limits {
        unsigned int            max_user_discard_sectors;
        unsigned int            max_secure_erase_sectors;
        unsigned int            max_write_zeroes_sectors;
+       unsigned int            max_hw_zone_append_sectors;
        unsigned int            max_zone_append_sectors;
        unsigned int            discard_granularity;
        unsigned int            discard_alignment;
@@ -1204,25 +1205,9 @@ static inline unsigned int queue_max_segment_size(const struct request_queue *q)
        return q->limits.max_segment_size;
 }
 
-static inline unsigned int
-queue_limits_max_zone_append_sectors(const struct queue_limits *l)
-{
-       unsigned int max_sectors = min(l->chunk_sectors, l->max_hw_sectors);
-
-       return min_not_zero(l->max_zone_append_sectors, max_sectors);
-}
-
-static inline unsigned int queue_max_zone_append_sectors(struct request_queue *q)
-{
-       if (!blk_queue_is_zoned(q))
-               return 0;
-
-       return queue_limits_max_zone_append_sectors(&q->limits);
-}
-
 static inline bool queue_emulates_zone_append(struct request_queue *q)
 {
-       return blk_queue_is_zoned(q) && !q->limits.max_zone_append_sectors;
+       return blk_queue_is_zoned(q) && !q->limits.max_hw_zone_append_sectors;
 }
 
 static inline bool bdev_emulates_zone_append(struct block_device *bdev)
@@ -1233,7 +1218,7 @@ static inline bool bdev_emulates_zone_append(struct block_device *bdev)
 static inline unsigned int
 bdev_max_zone_append_sectors(struct block_device *bdev)
 {
-       return queue_max_zone_append_sectors(bdev_get_queue(bdev));
+       return bdev_limits(bdev)->max_zone_append_sectors;
 }
 
 static inline unsigned int bdev_max_segments(struct block_device *bdev)