[V4,10/15] blk-throttle: add a simple idle detection

Message ID ba2d677b381e94a2f6c4bf5108f4906c78e99d4f.1479161136.git.shli@fb.com (mailing list archive)
State New, archived

Commit Message

Shaohua Li Nov. 14, 2016, 10:22 p.m. UTC
A cgroup may be assigned a high limit but never dispatch enough IO to
cross that limit. In such a case, the queue state machine will remain in
the LIMIT_HIGH state and all other cgroups will be throttled according
to their high limits. This is unfair to the other cgroups. We should
treat such a cgroup as idle and upgrade the state machine to a higher
state.

We also have downgrade logic. If the state machine upgrades because a
cgroup is idle (really idle), it will soon downgrade again because the
cgroup stays below its high limit. This isn't what we want. A more
complicated case is a cgroup that isn't idle while the queue is in
LIMIT_HIGH, but once the queue is upgraded to a higher state, other
cgroups dispatch more IO and this cgroup can't dispatch enough, so it
falls below its high limit and looks idle (fake idle). In this case, the
queue should downgrade soon. The key to deciding whether to downgrade is
detecting whether the cgroup is truly idle.

Unfortunately it's very hard to determine whether a cgroup is really
idle. This patch uses the 'think time check' idea from CFQ for that
purpose. Please note that the idea doesn't work for all workloads. For
example, a workload with io depth 8 keeps the disk 100% utilized, hence
its think time is 0, i.e., not idle; yet the same workload could achieve
higher bandwidth with io depth 16. Compared to the io depth 16 case, the
io depth 8 workload is idle. We use the idea only to roughly determine
whether a cgroup is idle.

We treat a cgroup as idle if its think time is above a threshold (by
default 50us for SSD and 1ms for HD). The idea is that think time above
the threshold starts to harm performance. HD is much slower, so a longer
think time is acceptable.
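
Roughly, in stand-alone C (the names below are made up for illustration,
not the kernel interfaces), the check keeps an exponentially weighted
average of the gap between an IO's completion and the next IO's
submission from the same cgroup, and compares it against the threshold:

#include <stdbool.h>
#include <stdint.h>

#define IDLE_THRESHOLD_SSD_NS	(50ULL * 1000)		/* 50 us */
#define IDLE_THRESHOLD_HD_NS	(1000ULL * 1000)	/* 1 ms */

struct grp_sample {
	uint64_t last_finish_time;	/* completion time of the previous IO */
	uint64_t avg_ttime;		/* EWMA of think time, in ns */
};

/* Called on each newly submitted IO: fold in the new think-time sample. */
static void update_think_time(struct grp_sample *g, uint64_t now)
{
	if (g->last_finish_time && now > g->last_finish_time) {
		uint64_t sample = now - g->last_finish_time;

		/* same 7/8 old + 1/8 new weighting the patch uses */
		g->avg_ttime = (g->avg_ttime * 7 + sample) >> 3;
	}
}

/* A group counts as idle if it hasn't completed IO for a long time or
 * its average think time exceeds the threshold. */
static bool group_is_idle(const struct grp_sample *g, uint64_t now,
			  uint64_t threshold_ns)
{
	return now - g->last_finish_time > 4 * threshold_ns ||
	       g->avg_ttime > threshold_ns;
}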

Signed-off-by: Shaohua Li <shli@fb.com>
---
 block/bio.c               |  2 ++
 block/blk-throttle.c      | 72 ++++++++++++++++++++++++++++++++++++++++++++++-
 block/blk.h               |  2 ++
 include/linux/blk_types.h |  1 +
 4 files changed, 76 insertions(+), 1 deletion(-)

Comments

Tejun Heo Nov. 23, 2016, 9:46 p.m. UTC | #1
Hello, Shaohua.

On Mon, Nov 14, 2016 at 02:22:17PM -0800, Shaohua Li wrote:
> Unfortunately it's very hard to determine if a cgroup is real idle. This
> patch uses the 'think time check' idea from CFQ for the purpose. Please
> note, the idea doesn't work for all workloads. For example, a workload
> with io depth 8 has disk utilization 100%, hence think time is 0, eg,
> not idle. But the workload can run higher bandwidth with io depth 16.
> Compared to io depth 16, the io depth 8 workload is idle. We use the
> idea to roughly determine if a cgroup is idle.

Hmm... I'm not sure thinktime is the best measure here.  Think time is
used by cfq mainly to tell the likely future behavior of a workload so
that cfq can take speculative actions on the prediction.  However,
given that the implemented high limit behavior tries to provide a
certain latency target, using the predictive thinktime to regulate
behavior might lead to overly unpredictable behavior.

Moreover, I don't see why we need to bother with predictions anyway.
cfq needed it but I don't think that's the case for blk-throtl.  It
can just provide an idle threshold where a cgroup which hasn't issued
an IO for longer than that threshold is considered idle.  That'd be a
lot easier to
understand and configure from userland while providing a good enough
mechanism to prevent idle cgroups from clamping down utilization for
too long.
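
(Concretely, the plain check I have in mind is nothing more involved
than the sketch below; the names are made up, just to show how simple
it would be.)

#include <stdbool.h>
#include <stdint.h>

/* Hypothetical sketch: idle == no IO issued for idle_threshold_ns. */
static bool tg_is_idle_simple(uint64_t last_dispatch_time, uint64_t now,
			      uint64_t idle_threshold_ns)
{
	return now - last_dispatch_time > idle_threshold_ns;
}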

Thanks.
Shaohua Li Nov. 24, 2016, 1:15 a.m. UTC | #2
On Wed, Nov 23, 2016 at 04:46:19PM -0500, Tejun Heo wrote:
> Hello, Shaohua.
> 
> On Mon, Nov 14, 2016 at 02:22:17PM -0800, Shaohua Li wrote:
> > Unfortunately it's very hard to determine if a cgroup is real idle. This
> > patch uses the 'think time check' idea from CFQ for the purpose. Please
> > note, the idea doesn't work for all workloads. For example, a workload
> > with io depth 8 has disk utilization 100%, hence think time is 0, eg,
> > not idle. But the workload can run higher bandwidth with io depth 16.
> > Compared to io depth 16, the io depth 8 workload is idle. We use the
> > idea to roughly determine if a cgroup is idle.
> 
> Hmm... I'm not sure thinktime is the best measure here.  Think time is
> used by cfq mainly to tell the likely future behavior of a workload so
> that cfq can take speculative actions on the prediction.  However,
> given that the implemented high limit behavior tries to provide a
> certain level of latency target, using the predictive thinktime to
> regulate behavior might lead to too unpredictable behaviors.

Latency just reflects one side of the IO. Latency and think time don't
have any direct relationship. For example, a cgroup dispatching 1 IO per
second can still see high latency. If we only take latency into account,
we will think the cgroup is busy, which is not justified.
 
> Moreover, I don't see why we need to bother with predictions anyway.
> cfq needed it but I don't think that's the case for blk-throtl.  It
> can just provide idle threshold where a cgroup which hasn't issued an
> IO over that threshold is considered idle.  That'd be a lot easier to
> understand and configure from userland while providing a good enough
> mechanism to prevent idle cgroups from clamping down utilization for
> too long.

We could do this, but it will only work for a very idle workload, i.e.,
one that is completely idle. If the workload dispatches IO sporadically,
this will likely not work. The average think time is more precise for
prediction.

Thanks,
Shaohua
Tejun Heo Nov. 28, 2016, 10:21 p.m. UTC | #3
Hello, Shaohua.

On Wed, Nov 23, 2016 at 05:15:18PM -0800, Shaohua Li wrote:
> > Hmm... I'm not sure thinktime is the best measure here.  Think time is
> > used by cfq mainly to tell the likely future behavior of a workload so
> > that cfq can take speculative actions on the prediction.  However,
> > given that the implemented high limit behavior tries to provide a
> > certain level of latency target, using the predictive thinktime to
> > regulate behavior might lead to too unpredictable behaviors.
> 
> Latency just reflects one side of the IO. Latency and think time haven't any
> relationship. For example, a cgroup dispatching 1 IO per second can still have
> high latency. If we only take latency account, we will think the cgroup is
> busy, which is not justified.

Yes, the two are independent metrics; however, whether a cgroup is
considered idle or not affects whether blk-throttle will adhere to the
latency target or not.  Thinktime is a magic number which can be good
but whose behavior can be very difficult to predict from outside the
black box.  What I was trying to say was that putting in thinktime
here can greatly weaken the configured latency target in unobvious
ways.

> > Moreover, I don't see why we need to bother with predictions anyway.
> > cfq needed it but I don't think that's the case for blk-throtl.  It
> > can just provide idle threshold where a cgroup which hasn't issued an
> > IO over that threshold is considered idle.  That'd be a lot easier to
> > understand and configure from userland while providing a good enough
> > mechanism to prevent idle cgroups from clamping down utilization for
> > too long.
> 
> We could do this, but it will only work for very idle workload, eg, the
> workload is completely idle. If workload dispatches IO sporadically, this will
> likely not work. The average think time is more precise for predication.

But we can increase sharing by upping the target latency.  That should
be the main knob - if low, the user wants stricter service guarantee
at the cost of lower overall utilization; if high, the workload can
deal with higher latency and the system can achieve higher overall
utilization.  I think the idle detection should be an extra mechanism
which can be used to ignore cgroup-disk combinations which are staying
idle for a long time.

Thanks.
Shaohua Li Nov. 28, 2016, 11:10 p.m. UTC | #4
On Mon, Nov 28, 2016 at 05:21:48PM -0500, Tejun Heo wrote:
> Hello, Shaohua.
> 
> On Wed, Nov 23, 2016 at 05:15:18PM -0800, Shaohua Li wrote:
> > > Hmm... I'm not sure thinktime is the best measure here.  Think time is
> > > used by cfq mainly to tell the likely future behavior of a workload so
> > > that cfq can take speculative actions on the prediction.  However,
> > > given that the implemented high limit behavior tries to provide a
> > > certain level of latency target, using the predictive thinktime to
> > > regulate behavior might lead to too unpredictable behaviors.
> > 
> > Latency just reflects one side of the IO. Latency and think time haven't any
> > relationship. For example, a cgroup dispatching 1 IO per second can still have
> > high latency. If we only take latency account, we will think the cgroup is
> > busy, which is not justified.
> 
> Yes, the two are indepndent metrics; however, whether a cgroup is
> considered idle or not affects whether blk-throttle will adhere to the
> latency target or not.  Thinktime is a magic number which can be good
> but whose behavior can be very difficult to predict from outside the
> black box.  What I was trying to say was that putting in thinktime
> here can greatly weaken the configured latency target in unobvious
> ways.
> 
> > > Moreover, I don't see why we need to bother with predictions anyway.
> > > cfq needed it but I don't think that's the case for blk-throtl.  It
> > > can just provide idle threshold where a cgroup which hasn't issued an
> > > IO over that threshold is considered idle.  That'd be a lot easier to
> > > understand and configure from userland while providing a good enough
> > > mechanism to prevent idle cgroups from clamping down utilization for
> > > too long.
> > 
> > We could do this, but it will only work for very idle workload, eg, the
> > workload is completely idle. If workload dispatches IO sporadically, this will
> > likely not work. The average think time is more precise for predication.
> 
> But we can increase sharing by upping the target latency.  That should
> be the main knob - if low, the user wants stricter service guarantee
> at the cost of lower overall utilization; if high, the workload can
> deal with higher latency and the system can achieve higher overall
> utilization.  I think the idle detection should be an extra mechanism
> which can be used to ignore cgroup-disk combinations which are staying
> idle for a long time.

Yes, we can increase the target latency to increase sharing. But latency
and think time are different. In the example I mentioned earlier, we
would have to raise the latency target a lot to increase sharing even
though the cgroup sends just 1 IO per second. I don't think that's what
users want. In summary, we can't use latency alone to determine whether
cgroups could dispatch more IO.

Currently the think time idle detection is an extra mechanism to ignore
a cgroup's limit. So currently we only ignore the cgroup limit when the
think time is big or the latency is small. This does make the behavior a
little harder to predict, e.g., the latency target is sometimes not
respected, but that is necessary to get better sharing.
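
(As a rough sketch, the upgrade decision combines the two signals like
this; illustrative names only, not the exact code in the series.)

#include <stdbool.h>
#include <stdint.h>

/* Illustrative: a cgroup's high limit is ignored (upgrade allowed) when
 * the cgroup looks idle by think time OR its measured latency is still
 * within the configured target. */
static bool can_ignore_high_limit(uint64_t avg_ttime, uint64_t ttime_threshold,
				  uint64_t latency, uint64_t latency_target)
{
	return avg_ttime > ttime_threshold || latency <= latency_target;
}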

Thanks,
Shaohua
Tejun Heo Nov. 29, 2016, 5:08 p.m. UTC | #5
Hello, Shaohua.

On Mon, Nov 28, 2016 at 03:10:18PM -0800, Shaohua Li wrote:
> > But we can increase sharing by upping the target latency.  That should
> > be the main knob - if low, the user wants stricter service guarantee
> > at the cost of lower overall utilization; if high, the workload can
> > deal with higher latency and the system can achieve higher overall
> > utilization.  I think the idle detection should be an extra mechanism
> > which can be used to ignore cgroup-disk combinations which are staying
> > idle for a long time.
> 
> Yes, we can increase target latency to increase sharing. But latency and think
> time are different. In the example I mentioned earlier, we must increase the
> latency target very big to increase sharing even the cgroup just sends 1 IO per
> second. Don't think this's what users want. In a summary, we can't only use
> latency to determine if cgroups could dispatch more IO.
> 
> Currently the think time idle detection is an extra mechanism to ignore cgroup
> limit. So we currently we only ignore cgroup limit when think time is big or
> latency is small. This does make the behavior a little bit difficult to
> predict, eg, not respect latency target sometimes, but this is necessary to
> have better sharing.

So, it's not like we can get better sharing for free.  It always comes
at the cost of the (best-effort) latency guarantee.  Using thinktime for
idle detection doesn't mean that we get higher utilization for free.
If we get higher utilization by using thinktime instead of plain idle
detection, it means that we're sacrificing the latency guarantee more
with thinktime, so I don't think the argument that using thinktime leads
to higher utilization is a clear winner.

That is not to say that there's no benefit to thinktime.  I can
imagine cases where it'd allow us to ride the line between acceptable
latency and good overall utilization better; however, that also comes
with cases where one has to wonder "what's going on?  I have no idea
what it's doing".

Given that blk-throttle is gonna ask for explicit and detailed
configuration from its users, I think it's vital that it has config
knobs which are immediately clear.  Being tedious is already a burden
and I don't think adding unpredictability there is a good idea.

Thanks.

Patch

diff --git a/block/bio.c b/block/bio.c
index db85c57..7baa86d 100644
--- a/block/bio.c
+++ b/block/bio.c
@@ -30,6 +30,7 @@ 
 #include <linux/cgroup.h>
 
 #include <trace/events/block.h>
+#include "blk.h"
 
 /*
  * Test patch to inline a certain number of bi_io_vec's inside the bio
@@ -1759,6 +1760,7 @@  void bio_endio(struct bio *bio)
 		goto again;
 	}
 
+	blk_throtl_bio_endio(bio);
 	if (bio->bi_end_io)
 		bio->bi_end_io(bio);
 }
diff --git a/block/blk-throttle.c b/block/blk-throttle.c
index 45a28c4..cb5fd85 100644
--- a/block/blk-throttle.c
+++ b/block/blk-throttle.c
@@ -21,6 +21,8 @@  static int throtl_quantum = 32;
 /* Throttling is performed over 100ms slice and after that slice is renewed */
 #define DFL_THROTL_SLICE (HZ / 10)
 #define MAX_THROTL_SLICE (HZ / 5)
+#define DFL_IDLE_THRESHOLD_SSD (50 * 1000) /* 50 us */
+#define DFL_IDLE_THRESHOLD_HD (1000 * 1000) /* 1 ms */
 
 static struct blkcg_policy blkcg_policy_throtl;
 
@@ -149,6 +151,10 @@  struct throtl_grp {
 	/* When did we start a new slice */
 	unsigned long slice_start[2];
 	unsigned long slice_end[2];
+
+	u64 last_finish_time;
+	u64 checked_last_finish_time;
+	u64 avg_ttime;
 };
 
 struct throtl_data
@@ -172,6 +178,8 @@  struct throtl_data
 	unsigned long high_downgrade_time;
 
 	unsigned int scale;
+
+	u64 idle_ttime_threshold;
 };
 
 static void throtl_pending_timer_fn(unsigned long arg);
@@ -1629,6 +1637,14 @@  static unsigned long tg_last_high_overflow_time(struct throtl_grp *tg)
 	return ret;
 }
 
+static bool throtl_tg_is_idle(struct throtl_grp *tg)
+{
+	/* cgroup is idle if average think time is more than threshold */
+	return ktime_get_ns() - tg->last_finish_time >
+		4 * tg->td->idle_ttime_threshold ||
+	       tg->avg_ttime > tg->td->idle_ttime_threshold;
+}
+
 static bool throtl_upgrade_check_one(struct throtl_grp *tg)
 {
 	struct throtl_service_queue *sq = &tg->service_queue;
@@ -1837,6 +1853,19 @@  static void throtl_downgrade_check(struct throtl_grp *tg)
 	tg->last_io_disp[WRITE] = 0;
 }
 
+static void blk_throtl_update_ttime(struct throtl_grp *tg)
+{
+	u64 now = ktime_get_ns();
+	u64 last_finish_time = tg->last_finish_time;
+
+	if (now <= last_finish_time || last_finish_time == 0 ||
+	    last_finish_time == tg->checked_last_finish_time)
+		return;
+
+	tg->avg_ttime = (tg->avg_ttime * 7 + now - last_finish_time) >> 3;
+	tg->checked_last_finish_time = last_finish_time;
+}
+
 bool blk_throtl_bio(struct request_queue *q, struct blkcg_gq *blkg,
 		    struct bio *bio)
 {
@@ -1848,6 +1877,13 @@  bool blk_throtl_bio(struct request_queue *q, struct blkcg_gq *blkg,
 
 	WARN_ON_ONCE(!rcu_read_lock_held());
 
+	if (tg->td->idle_ttime_threshold == -1) {
+		if (blk_queue_nonrot(q))
+			tg->td->idle_ttime_threshold = DFL_IDLE_THRESHOLD_SSD;
+		else
+			tg->td->idle_ttime_threshold = DFL_IDLE_THRESHOLD_HD;
+	}
+
 	/* see throtl_charge_bio() */
 	if ((bio->bi_opf & REQ_THROTTLED) || !tg->has_rules[rw])
 		goto out;
@@ -1857,6 +1893,11 @@  bool blk_throtl_bio(struct request_queue *q, struct blkcg_gq *blkg,
 	if (unlikely(blk_queue_bypass(q)))
 		goto out_unlock;
 
+	bio_associate_current(bio);
+	bio->bi_cg_private = q;
+
+	blk_throtl_update_ttime(tg);
+
 	sq = &tg->service_queue;
 
 again:
@@ -1917,7 +1958,6 @@  bool blk_throtl_bio(struct request_queue *q, struct blkcg_gq *blkg,
 
 	tg->last_high_overflow_time[rw] = jiffies;
 
-	bio_associate_current(bio);
 	tg->td->nr_queued[rw]++;
 	throtl_add_bio_tg(bio, qn, tg);
 	throttled = true;
@@ -1946,6 +1986,34 @@  bool blk_throtl_bio(struct request_queue *q, struct blkcg_gq *blkg,
 	return throttled;
 }
 
+void blk_throtl_bio_endio(struct bio *bio)
+{
+	struct blkcg *blkcg;
+	struct blkcg_gq *blkg;
+	struct throtl_grp *tg;
+	struct request_queue *q;
+
+	q = bio->bi_cg_private;
+	if (!q)
+		return;
+	bio->bi_cg_private = NULL;
+
+	rcu_read_lock();
+	blkcg = bio_blkcg(bio);
+	if (!blkcg)
+		goto end;
+	blkg = blkg_lookup(blkcg, q);
+	if (!blkg)
+		goto end;
+
+	tg = blkg_to_tg(blkg ?: q->root_blkg);
+
+	tg->last_finish_time = ktime_get_ns();
+
+end:
+	rcu_read_unlock();
+}
+
 /*
  * Dispatch all bios from all children tg's queued on @parent_sq.  On
  * return, @parent_sq is guaranteed to not have any active children tg's
@@ -2030,6 +2098,8 @@  int blk_throtl_init(struct request_queue *q)
 	td->limit_index = LIMIT_MAX;
 	td->high_upgrade_time = jiffies;
 	td->high_downgrade_time = jiffies;
+
+	td->idle_ttime_threshold = -1;
 	/* activate policy */
 	ret = blkcg_activate_policy(q, &blkcg_policy_throtl);
 	if (ret)
diff --git a/block/blk.h b/block/blk.h
index 39c14dd..b433f35 100644
--- a/block/blk.h
+++ b/block/blk.h
@@ -292,10 +292,12 @@  extern void blk_throtl_exit(struct request_queue *q);
 extern ssize_t blk_throtl_slice_show(struct request_queue *q, char *page);
 extern ssize_t blk_throtl_slice_store(struct request_queue *q,
 	const char *page, size_t count);
+extern void blk_throtl_bio_endio(struct bio *bio);
 #else /* CONFIG_BLK_DEV_THROTTLING */
 static inline void blk_throtl_drain(struct request_queue *q) { }
 static inline int blk_throtl_init(struct request_queue *q) { return 0; }
 static inline void blk_throtl_exit(struct request_queue *q) { }
+static inline void blk_throtl_bio_endio(struct bio *bio) { }
 #endif /* CONFIG_BLK_DEV_THROTTLING */
 
 #endif /* BLK_INTERNAL_H */
diff --git a/include/linux/blk_types.h b/include/linux/blk_types.h
index cd395ec..ff8dd24 100644
--- a/include/linux/blk_types.h
+++ b/include/linux/blk_types.h
@@ -59,6 +59,7 @@  struct bio {
 	 */
 	struct io_context	*bi_ioc;
 	struct cgroup_subsys_state *bi_css;
+	void *bi_cg_private;
 #endif
 	union {
 #if defined(CONFIG_BLK_DEV_INTEGRITY)