spin_unlock_irq(&q->queue_lock);
 }
 
+static bool tg_within_limit(struct throtl_grp *tg, struct bio *bio, bool rw)
+{
+       /* throtl is FIFO - if bios are already queued, this one must queue too */
+       if (tg->service_queue.nr_queued[rw])
+               return false;
+
+       return tg_may_dispatch(tg, bio, NULL);
+}
+
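+/*
+ * Account @bio, which is dispatched while @tg is over its limit, as debt in
+ * the carryover counters; the debt is repaid when wait times are calculated
+ * for later bios. Bytes already accounted for bps throttling
+ * (BIO_BPS_THROTTLED) are not charged again.
+ */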
+static void tg_dispatch_in_debt(struct throtl_grp *tg, struct bio *bio, bool rw)
+{
+       if (!bio_flagged(bio, BIO_BPS_THROTTLED))
+               tg->carryover_bytes[rw] -= throtl_bio_data_size(bio);
+       tg->carryover_ios[rw]--;
+}
+
 bool __blk_throtl_bio(struct bio *bio)
 {
        struct request_queue *q = bdev_get_queue(bio->bi_bdev);
        sq = &tg->service_queue;
 
        while (true) {
-               /* throtl is FIFO - if bios are already queued, should queue */
-               if (sq->nr_queued[rw])
+               if (tg_within_limit(tg, bio, rw)) {
+                       /* within limits, let's charge and dispatch directly */
+                       throtl_charge_bio(tg, bio);
+
+                       /*
+                        * We need to trim slice even when bios are not being
+                        * queued otherwise it might happen that a bio is not
+                        * queued for a long time and slice keeps on extending
+                        * and trim is not called for a long time. Now if limits
+                        * are reduced suddenly we take into account all the IO
+                        * dispatched so far at new low rate and newly queued
+                        * IO gets a really long dispatch time.
+                        *
+                        * So keep on trimming slice even if bio is not queued.
+                        */
+                       throtl_trim_slice(tg, rw);
+               } else if (bio_issue_as_root_blkg(bio)) {
+                       /*
+                        * IOs which may cause priority inversions are
+                        * dispatched directly, even if they're over limit.
+                        * Debts are handled by carryover_bytes/ios while
+                        * calculating wait time.
+                        */
+                       tg_dispatch_in_debt(tg, bio, rw);
+               } else {
+                       /* if above limits, break to queue */
                        break;
-
-               /* if above limits, break to queue */
-               if (!tg_may_dispatch(tg, bio, NULL))
-                       break;
-
-               /* within limits, let's charge and dispatch directly */
-               throtl_charge_bio(tg, bio);
-
-               /*
-                * We need to trim slice even when bios are not being queued
-                * otherwise it might happen that a bio is not queued for
-                * a long time and slice keeps on extending and trim is not
-                * called for a long time. Now if limits are reduced suddenly
-                * we take into account all the IO dispatched so far at new
-                * low rate and * newly queued IO gets a really long dispatch
-                * time.
-                *
-                * So keep on trimming slice even if bio is not queued.
-                */
-               throtl_trim_slice(tg, rw);
+               }
 
                /*
                 * @bio passed through this layer without being throttled.