summaryrefslogtreecommitdiffstats
path: root/block/blk-throttle.c
diff options
context:
space:
mode:
authorShaohua Li <shli@fb.com>2017-03-27 13:51:39 -0400
committerJens Axboe <axboe@fb.com>2017-03-28 10:02:20 -0400
commitaec242468cb84b8eea7130c10530a69d2b352bff (patch)
treeca582c28dd2c2023025456691b19ff420b5939e5 /block/blk-throttle.c
parentd61fcfa4bb18992dc8e171996808e1034dc643bb (diff)
blk-throttle: detect completed idle cgroup
cgroup could be assigned a limit, but doesn't dispatch enough IO, eg the cgroup is idle. When this happens, the cgroup doesn't hit its limit, so we can't move the state machine to higher level and all cgroups will be throttled to their lower limit, so we waste bandwidth. Detecting idle cgroup is hard. This patch handles a simple case, a cgroup doesn't dispatch any IO. We ignore such cgroup's limit, so other cgroups can use the bandwidth. Please note this will be replaced with a more sophisticated algorithm later, but this demonstrates the idea how we handle idle cgroups, so I leave it here. Signed-off-by: Shaohua Li <shli@fb.com> Signed-off-by: Jens Axboe <axboe@fb.com>
Diffstat (limited to 'block/blk-throttle.c')
-rw-r--r--block/blk-throttle.c19
1 files changed, 18 insertions, 1 deletions
diff --git a/block/blk-throttle.c b/block/blk-throttle.c
index d00c1c1e99e4..014b2e96a423 100644
--- a/block/blk-throttle.c
+++ b/block/blk-throttle.c
@@ -149,6 +149,8 @@ struct throtl_grp {
149 149
150 unsigned long last_check_time; 150 unsigned long last_check_time;
151 151
152 unsigned long last_dispatch_time[2];
153
152 /* When did we start a new slice */ 154 /* When did we start a new slice */
153 unsigned long slice_start[2]; 155 unsigned long slice_start[2];
154 unsigned long slice_end[2]; 156 unsigned long slice_end[2];
@@ -445,11 +447,14 @@ static void tg_update_has_rules(struct throtl_grp *tg)
445 447
446static void throtl_pd_online(struct blkg_policy_data *pd) 448static void throtl_pd_online(struct blkg_policy_data *pd)
447{ 449{
450 struct throtl_grp *tg = pd_to_tg(pd);
448 /* 451 /*
449 * We don't want new groups to escape the limits of its ancestors. 452 * We don't want new groups to escape the limits of its ancestors.
450 * Update has_rules[] after a new group is brought online. 453 * Update has_rules[] after a new group is brought online.
451 */ 454 */
452 tg_update_has_rules(pd_to_tg(pd)); 455 tg_update_has_rules(tg);
456 tg->last_dispatch_time[READ] = jiffies;
457 tg->last_dispatch_time[WRITE] = jiffies;
453} 458}
454 459
455static void blk_throtl_update_limit_valid(struct throtl_data *td) 460static void blk_throtl_update_limit_valid(struct throtl_data *td)
@@ -1615,6 +1620,12 @@ static bool throtl_tg_can_upgrade(struct throtl_grp *tg)
1615 if (write_limit && sq->nr_queued[WRITE] && 1620 if (write_limit && sq->nr_queued[WRITE] &&
1616 (!read_limit || sq->nr_queued[READ])) 1621 (!read_limit || sq->nr_queued[READ]))
1617 return true; 1622 return true;
1623
1624 if (time_after_eq(jiffies,
1625 tg->last_dispatch_time[READ] + tg->td->throtl_slice) &&
1626 time_after_eq(jiffies,
1627 tg->last_dispatch_time[WRITE] + tg->td->throtl_slice))
1628 return true;
1618 return false; 1629 return false;
1619} 1630}
1620 1631
@@ -1692,6 +1703,11 @@ static bool throtl_tg_can_downgrade(struct throtl_grp *tg)
1692 struct throtl_data *td = tg->td; 1703 struct throtl_data *td = tg->td;
1693 unsigned long now = jiffies; 1704 unsigned long now = jiffies;
1694 1705
1706 if (time_after_eq(now, tg->last_dispatch_time[READ] +
1707 td->throtl_slice) &&
1708 time_after_eq(now, tg->last_dispatch_time[WRITE] +
1709 td->throtl_slice))
1710 return false;
1695 /* 1711 /*
1696 * If cgroup is below low limit, consider downgrade and throttle other 1712 * If cgroup is below low limit, consider downgrade and throttle other
1697 * cgroups 1713 * cgroups
@@ -1800,6 +1816,7 @@ bool blk_throtl_bio(struct request_queue *q, struct blkcg_gq *blkg,
1800 1816
1801again: 1817again:
1802 while (true) { 1818 while (true) {
1819 tg->last_dispatch_time[rw] = jiffies;
1803 if (tg->last_low_overflow_time[rw] == 0) 1820 if (tg->last_low_overflow_time[rw] == 0)
1804 tg->last_low_overflow_time[rw] = jiffies; 1821 tg->last_low_overflow_time[rw] = jiffies;
1805 throtl_downgrade_check(tg); 1822 throtl_downgrade_check(tg);