[parent not found: <20221217030527.1250083-1-yukuai1-XF6JlduFytWkHkcT6e4Xnw@public.gmane.org>]
* [PATCH -next 1/4] blk-iocost: track whether iocg is still online
[not found] ` <20221217030527.1250083-1-yukuai1-XF6JlduFytWkHkcT6e4Xnw@public.gmane.org>
@ 2022-12-17 3:05 ` Yu Kuai
2022-12-21 10:33 ` Christoph Hellwig
0 siblings, 1 reply; 10+ messages in thread
From: Yu Kuai @ 2022-12-17 3:05 UTC (permalink / raw)
To: tj-DgEjT+Ai2ygdnm+yROfE0A, hch-wEGCiKHe2LqWVfeAwA7xHQ,
josef-DigfWCa+lFGyeJad7bwFQA, axboe-tSWWG44O7X1aa/9Udqfwiw
Cc: cgroups-u79uwXL29TY76Z2rM5mHXA,
linux-block-u79uwXL29TY76Z2rM5mHXA,
linux-kernel-u79uwXL29TY76Z2rM5mHXA,
yukuai3-hv44wF8Li93QT0dZR+AlfA, yukuai1-XF6JlduFytWkHkcT6e4Xnw,
yi.zhang-hv44wF8Li93QT0dZR+AlfA
From: Yu Kuai <yukuai3-hv44wF8Li93QT0dZR+AlfA@public.gmane.org>
blkcg_gq->online can't be used in iocost because it gets cleared only after
all policies are offlined. This patch add a new field 'online' in iocg.
Signed-off-by: Yu Kuai <yukuai3-hv44wF8Li93QT0dZR+AlfA@public.gmane.org>
---
block/blk-iocost.c | 17 +++++++++++++++++
1 file changed, 17 insertions(+)
diff --git a/block/blk-iocost.c b/block/blk-iocost.c
index 3aeb8538f0c3..1498879c4a52 100644
--- a/block/blk-iocost.c
+++ b/block/blk-iocost.c
@@ -459,6 +459,8 @@ struct ioc_gq {
struct blkg_policy_data pd;
struct ioc *ioc;
+ bool online;
+
/*
* A iocg can get its weight from two sources - an explicit
* per-device-cgroup configuration or the default weight of the
@@ -2952,6 +2954,7 @@ static void ioc_pd_init(struct blkg_policy_data *pd)
ioc_now(ioc, &now);
iocg->ioc = ioc;
+ iocg->online = true;
atomic64_set(&iocg->vtime, now.vnow);
atomic64_set(&iocg->done_vtime, now.vnow);
atomic64_set(&iocg->active_period, atomic64_read(&ioc->cur_period));
@@ -2977,6 +2980,19 @@ static void ioc_pd_init(struct blkg_policy_data *pd)
spin_unlock_irqrestore(&ioc->lock, flags);
}
+static void ioc_pd_offline(struct blkg_policy_data *pd)
+{
+ struct ioc_gq *iocg = pd_to_iocg(pd);
+ struct ioc *ioc = iocg->ioc;
+ unsigned long flags;
+
+ if (ioc) {
+ spin_lock_irqsave(&ioc->lock, flags);
+ iocg->online = false;
+ spin_unlock_irqrestore(&ioc->lock, flags);
+ }
+}
+
static void ioc_pd_free(struct blkg_policy_data *pd)
{
struct ioc_gq *iocg = pd_to_iocg(pd);
@@ -3467,6 +3483,7 @@ static struct blkcg_policy blkcg_policy_iocost = {
.cpd_free_fn = ioc_cpd_free,
.pd_alloc_fn = ioc_pd_alloc,
.pd_init_fn = ioc_pd_init,
+ .pd_offline_fn = ioc_pd_offline,
.pd_free_fn = ioc_pd_free,
.pd_stat_fn = ioc_pd_stat,
};
--
2.31.1
^ permalink raw reply related [flat|nested] 10+ messages in thread* Re: [PATCH -next 1/4] blk-iocost: track whether iocg is still online
2022-12-17 3:05 ` [PATCH -next 1/4] blk-iocost: track whether iocg is still online Yu Kuai
@ 2022-12-21 10:33 ` Christoph Hellwig
[not found] ` <Y6LhD8CEkcgLUJoQ-wEGCiKHe2LqWVfeAwA7xHQ@public.gmane.org>
0 siblings, 1 reply; 10+ messages in thread
From: Christoph Hellwig @ 2022-12-21 10:33 UTC (permalink / raw)
To: Yu Kuai
Cc: tj, hch, josef, axboe, cgroups, linux-block, linux-kernel,
yukuai3, yi.zhang
On Sat, Dec 17, 2022 at 11:05:24AM +0800, Yu Kuai wrote:
> @@ -459,6 +459,8 @@ struct ioc_gq {
> struct blkg_policy_data pd;
> struct ioc *ioc;
>
> + bool online;
Nit: maybe tab align this field like the fields above it.
> +static void ioc_pd_offline(struct blkg_policy_data *pd)
> +{
> + struct ioc_gq *iocg = pd_to_iocg(pd);
> + struct ioc *ioc = iocg->ioc;
> + unsigned long flags;
> +
> + if (ioc) {
How could ioc be NULL here?
^ permalink raw reply [flat|nested] 10+ messages in thread
* [PATCH -next 2/4] blk-iocost: don't throttle bio if iocg is offlined
2022-12-17 3:05 [PATCH -next 0/4] blk-iocost: make sure parent iocg is exited before child Yu Kuai
[not found] ` <20221217030527.1250083-1-yukuai1-XF6JlduFytWkHkcT6e4Xnw@public.gmane.org>
@ 2022-12-17 3:05 ` Yu Kuai
2022-12-19 21:28 ` Tejun Heo
2022-12-17 3:05 ` [PATCH -next 3/4] blk-iocost: dispatch all throttled bio in ioc_pd_offline Yu Kuai
2022-12-17 3:05 ` [PATCH -next 4/4] blk-iocost: guarantee the exit order of iocg Yu Kuai
3 siblings, 1 reply; 10+ messages in thread
From: Yu Kuai @ 2022-12-17 3:05 UTC (permalink / raw)
To: tj, hch, josef, axboe
Cc: cgroups, linux-block, linux-kernel, yukuai3, yukuai1, yi.zhang
From: Yu Kuai <yukuai3@huawei.com>
bio will grab blkg reference, however, blkcg->online_pin is not grabbed,
hence cgroup can be removed after thread exit while bio is still in
progress. Bypass io in this case since it doesn't make sense to
throttle bio while cgroup is removed.
This patch also prepare to move operations on iocg from ioc_pd_free()
to ioc_pd_offline().
Signed-off-by: Yu Kuai <yukuai3@huawei.com>
---
block/blk-iocost.c | 24 ++++++++++++++++++++----
1 file changed, 20 insertions(+), 4 deletions(-)
diff --git a/block/blk-iocost.c b/block/blk-iocost.c
index 1498879c4a52..23cc734dbe43 100644
--- a/block/blk-iocost.c
+++ b/block/blk-iocost.c
@@ -695,6 +695,20 @@ static struct ioc_cgrp *blkcg_to_iocc(struct blkcg *blkcg)
struct ioc_cgrp, cpd);
}
+static struct ioc_gq *ioc_bio_iocg(struct bio *bio)
+{
+ struct blkcg_gq *blkg = bio->bi_blkg;
+
+ if (blkg && blkg->online) {
+ struct ioc_gq *iocg = blkg_to_iocg(blkg);
+
+ if (iocg && iocg->online)
+ return iocg;
+ }
+
+ return NULL;
+}
+
/*
* Scale @abs_cost to the inverse of @hw_inuse. The lower the hierarchical
* weight, the more expensive each IO. Must round up.
@@ -1262,6 +1276,9 @@ static bool iocg_activate(struct ioc_gq *iocg, struct ioc_now *now)
spin_lock_irq(&ioc->lock);
+ if (!iocg->online)
+ goto fail_unlock;
+
ioc_now(ioc, now);
/* update period */
@@ -2561,9 +2578,8 @@ static u64 calc_size_vtime_cost(struct request *rq, struct ioc *ioc)
static void ioc_rqos_throttle(struct rq_qos *rqos, struct bio *bio)
{
- struct blkcg_gq *blkg = bio->bi_blkg;
struct ioc *ioc = rqos_to_ioc(rqos);
- struct ioc_gq *iocg = blkg_to_iocg(blkg);
+ struct ioc_gq *iocg = ioc_bio_iocg(bio);
struct ioc_now now;
struct iocg_wait wait;
u64 abs_cost, cost, vtime;
@@ -2697,7 +2713,7 @@ static void ioc_rqos_throttle(struct rq_qos *rqos, struct bio *bio)
static void ioc_rqos_merge(struct rq_qos *rqos, struct request *rq,
struct bio *bio)
{
- struct ioc_gq *iocg = blkg_to_iocg(bio->bi_blkg);
+ struct ioc_gq *iocg = ioc_bio_iocg(bio);
struct ioc *ioc = rqos_to_ioc(rqos);
sector_t bio_end = bio_end_sector(bio);
struct ioc_now now;
@@ -2755,7 +2771,7 @@ static void ioc_rqos_merge(struct rq_qos *rqos, struct request *rq,
static void ioc_rqos_done_bio(struct rq_qos *rqos, struct bio *bio)
{
- struct ioc_gq *iocg = blkg_to_iocg(bio->bi_blkg);
+ struct ioc_gq *iocg = ioc_bio_iocg(bio);
if (iocg && bio->bi_iocost_cost)
atomic64_add(bio->bi_iocost_cost, &iocg->done_vtime);
--
2.31.1
^ permalink raw reply related [flat|nested] 10+ messages in thread* Re: [PATCH -next 2/4] blk-iocost: don't throttle bio if iocg is offlined
2022-12-17 3:05 ` [PATCH -next 2/4] blk-iocost: don't throttle bio if iocg is offlined Yu Kuai
@ 2022-12-19 21:28 ` Tejun Heo
[not found] ` <Y6DXkLeOmu7VWovz-NiLfg/pYEd1N0TnZuCh8vA@public.gmane.org>
0 siblings, 1 reply; 10+ messages in thread
From: Tejun Heo @ 2022-12-19 21:28 UTC (permalink / raw)
To: Yu Kuai
Cc: hch, josef, axboe, cgroups, linux-block, linux-kernel, yukuai3,
yi.zhang
On Sat, Dec 17, 2022 at 11:05:25AM +0800, Yu Kuai wrote:
> From: Yu Kuai <yukuai3@huawei.com>
>
> bio will grab blkg reference, however, blkcg->online_pin is not grabbed,
> hence cgroup can be removed after thread exit while bio is still in
> progress. Bypass io in this case since it doesn't make sense to
> throttle bio while cgroup is removed.
I don't get it. Why wouldn't that make sense? ISTR some occasions where we
clear the config to mitigate exits stalling for too long but in general a
policy being active on a draining cgroup shouldn't be a problem.
Thanks.
--
tejun
^ permalink raw reply [flat|nested] 10+ messages in thread
* [PATCH -next 3/4] blk-iocost: dispatch all throttled bio in ioc_pd_offline
2022-12-17 3:05 [PATCH -next 0/4] blk-iocost: make sure parent iocg is exited before child Yu Kuai
[not found] ` <20221217030527.1250083-1-yukuai1-XF6JlduFytWkHkcT6e4Xnw@public.gmane.org>
2022-12-17 3:05 ` [PATCH -next 2/4] blk-iocost: don't throttle bio if iocg is offlined Yu Kuai
@ 2022-12-17 3:05 ` Yu Kuai
[not found] ` <20221217030527.1250083-4-yukuai1-XF6JlduFytWkHkcT6e4Xnw@public.gmane.org>
2022-12-17 3:05 ` [PATCH -next 4/4] blk-iocost: guarantee the exit order of iocg Yu Kuai
3 siblings, 1 reply; 10+ messages in thread
From: Yu Kuai @ 2022-12-17 3:05 UTC (permalink / raw)
To: tj, hch, josef, axboe
Cc: cgroups, linux-block, linux-kernel, yukuai3, yukuai1, yi.zhang
From: Yu Kuai <yukuai3@huawei.com>
Currently, if cgroup is removed while some bio is still throttled, such
bio will still wait for timer to dispatch. On the one hand, it
doesn't make sense to throttle bio while cgroup is removed, on the other
hand, this behaviour makes it hard to guarantee the exit order for
iocg(in ioc_pd_free() currently).
This patch make iocg->online updated under both 'ioc->lock' and
'iocg->waitq.lock', so it can be guaranteed that iocg will stay online
while holding any lock. In the meantime, all throttled bio will be
dispatched immediately in ioc_pd_offline().
This patch also prepare to move operations on iocg from ioc_pd_free()
to ioc_pd_offline().
Signed-off-by: Yu Kuai <yukuai3@huawei.com>
---
block/blk-iocost.c | 25 ++++++++++++++++---------
1 file changed, 16 insertions(+), 9 deletions(-)
diff --git a/block/blk-iocost.c b/block/blk-iocost.c
index 23cc734dbe43..b63ecfdd815c 100644
--- a/block/blk-iocost.c
+++ b/block/blk-iocost.c
@@ -1448,14 +1448,18 @@ static int iocg_wake_fn(struct wait_queue_entry *wq_entry, unsigned mode,
{
struct iocg_wait *wait = container_of(wq_entry, struct iocg_wait, wait);
struct iocg_wake_ctx *ctx = key;
- u64 cost = abs_cost_to_cost(wait->abs_cost, ctx->hw_inuse);
- ctx->vbudget -= cost;
+ if (ctx->iocg->online) {
+ u64 cost = abs_cost_to_cost(wait->abs_cost, ctx->hw_inuse);
- if (ctx->vbudget < 0)
- return -1;
+ ctx->vbudget -= cost;
+
+ if (ctx->vbudget < 0)
+ return -1;
+
+ iocg_commit_bio(ctx->iocg, wait->bio, wait->abs_cost, cost);
+ }
- iocg_commit_bio(ctx->iocg, wait->bio, wait->abs_cost, cost);
wait->committed = true;
/*
@@ -3003,9 +3007,14 @@ static void ioc_pd_offline(struct blkg_policy_data *pd)
unsigned long flags;
if (ioc) {
- spin_lock_irqsave(&ioc->lock, flags);
+ struct iocg_wake_ctx ctx = { .iocg = iocg };
+
+ iocg_lock(iocg, true, &flags);
iocg->online = false;
- spin_unlock_irqrestore(&ioc->lock, flags);
+ iocg_unlock(iocg, true, &flags);
+
+ hrtimer_cancel(&iocg->waitq_timer);
+ __wake_up(&iocg->waitq, TASK_NORMAL, 0, &ctx);
}
}
@@ -3030,8 +3039,6 @@ static void ioc_pd_free(struct blkg_policy_data *pd)
WARN_ON_ONCE(!list_empty(&iocg->surplus_list));
spin_unlock_irqrestore(&ioc->lock, flags);
-
- hrtimer_cancel(&iocg->waitq_timer);
}
free_percpu(iocg->pcpu_stat);
kfree(iocg);
--
2.31.1
^ permalink raw reply related [flat|nested] 10+ messages in thread* [PATCH -next 4/4] blk-iocost: guarantee the exit order of iocg
2022-12-17 3:05 [PATCH -next 0/4] blk-iocost: make sure parent iocg is exited before child Yu Kuai
` (2 preceding siblings ...)
2022-12-17 3:05 ` [PATCH -next 3/4] blk-iocost: dispatch all throttled bio in ioc_pd_offline Yu Kuai
@ 2022-12-17 3:05 ` Yu Kuai
3 siblings, 0 replies; 10+ messages in thread
From: Yu Kuai @ 2022-12-17 3:05 UTC (permalink / raw)
To: tj, hch, josef, axboe
Cc: cgroups, linux-block, linux-kernel, yukuai3, yukuai1, yi.zhang
From: Yu Kuai <yukuai3@huawei.com>
pd_offline_fn() is ensured to be called in order(parent after child),
while pd_free_fn() is not. Furthermore, rq_qos_exit() can also be called
before pd_free_fn(). For conclusion, doing cleanups in ioc_pd_free() is
not safe, which can cause many problems. By the way, iocost is the only
policy to do cleanups in pd_free_fn().
Since previous patches guarantee that ioc_pd_offline() will dispatch
throttled bio and prevent new io to be throttled. It's safe to move
cleanup operations for iocg from ioc_pd_free() to ioc_pd_offline().
Signed-off-by: Yu Kuai <yukuai3@huawei.com>
---
block/blk-iocost.c | 26 ++++++++++----------------
1 file changed, 10 insertions(+), 16 deletions(-)
diff --git a/block/blk-iocost.c b/block/blk-iocost.c
index b63ecfdd815c..d634ea73f991 100644
--- a/block/blk-iocost.c
+++ b/block/blk-iocost.c
@@ -3011,21 +3011,6 @@ static void ioc_pd_offline(struct blkg_policy_data *pd)
iocg_lock(iocg, true, &flags);
iocg->online = false;
- iocg_unlock(iocg, true, &flags);
-
- hrtimer_cancel(&iocg->waitq_timer);
- __wake_up(&iocg->waitq, TASK_NORMAL, 0, &ctx);
- }
-}
-
-static void ioc_pd_free(struct blkg_policy_data *pd)
-{
- struct ioc_gq *iocg = pd_to_iocg(pd);
- struct ioc *ioc = iocg->ioc;
- unsigned long flags;
-
- if (ioc) {
- spin_lock_irqsave(&ioc->lock, flags);
if (!list_empty(&iocg->active_list)) {
struct ioc_now now;
@@ -3038,8 +3023,17 @@ static void ioc_pd_free(struct blkg_policy_data *pd)
WARN_ON_ONCE(!list_empty(&iocg->walk_list));
WARN_ON_ONCE(!list_empty(&iocg->surplus_list));
- spin_unlock_irqrestore(&ioc->lock, flags);
+ iocg_unlock(iocg, true, &flags);
+
+ hrtimer_cancel(&iocg->waitq_timer);
+ __wake_up(&iocg->waitq, TASK_NORMAL, 0, &ctx);
}
+}
+
+static void ioc_pd_free(struct blkg_policy_data *pd)
+{
+ struct ioc_gq *iocg = pd_to_iocg(pd);
+
free_percpu(iocg->pcpu_stat);
kfree(iocg);
}
--
2.31.1
^ permalink raw reply related [flat|nested] 10+ messages in thread