Lines Matching +full:down +full:- +full:scaling
1 // SPDX-License-Identifier: GPL-2.0
6 * - Monitor latencies in a defined window of time.
7 * - If the minimum latency in the above window exceeds some target, increment
8 * scaling step and scale down queue depth by a factor of 2x. The monitoring
9 * window is then shrunk to 100 / sqrt(scaling step + 1).
10 * - For any window where we don't have solid data on what the latencies
12 * - If latencies look good, decrement scaling step.
13 * - If we're only doing writes, allow the scaling step to go negative. This
15 * scaling step of 0 if reads show up or the heavy writers finish. Unlike
16 * positive scaling steps where we shrink the monitoring window, a negative
17 * scaling step retains the default step==0 window size.
25 #include <linux/backing-dev.h>
28 #include "blk-stat.h"
29 #include "blk-wbt.h"
30 #include "blk-rq-qos.h"
76 * information to make a firm scale up/down decision.
103 rq->wbt_flags = 0; in wbt_clear_state()
108 return rq->wbt_flags; in wbt_flags()
113 return rq->wbt_flags & WBT_TRACKED; in wbt_is_tracked()
118 return rq->wbt_flags & WBT_READ; in wbt_is_read()
123 * Default setting, we'll scale up (to 75% of QD max) or down (min 1)
140 * information to scale up or down, slowly return to center state
148 return rwb && rwb->enable_state != WBT_STATE_OFF_DEFAULT && in rwb_enabled()
149 rwb->enable_state != WBT_STATE_OFF_MANUAL; in rwb_enabled()
168 struct backing_dev_info *bdi = rwb->rqos.disk->bdi; in wb_recent_wait()
170 return time_before(jiffies, bdi->last_bdp_sleep + HZ); in wb_recent_wait()
177 return &rwb->rq_wait[WBT_RWQ_SWAP]; in get_rq_wait()
179 return &rwb->rq_wait[WBT_RWQ_DISCARD]; in get_rq_wait()
181 return &rwb->rq_wait[WBT_RWQ_BG]; in get_rq_wait()
189 struct rq_wait *rqw = &rwb->rq_wait[i]; in rwb_wake_all()
191 if (wq_has_sleeper(&rqw->wait)) in rwb_wake_all()
192 wake_up_all(&rqw->wait); in rwb_wake_all()
201 inflight = atomic_dec_return(&rqw->inflight); in wbt_rqw_done()
205 * the device does write back caching, drop further down before we in wbt_rqw_done()
209 limit = rwb->wb_background; in wbt_rqw_done()
210 else if (blk_queue_write_cache(rwb->rqos.disk->queue) && in wbt_rqw_done()
214 limit = rwb->wb_normal; in wbt_rqw_done()
222 if (wq_has_sleeper(&rqw->wait)) { in wbt_rqw_done()
223 int diff = limit - inflight; in wbt_rqw_done()
225 if (!inflight || diff >= rwb->wb_background / 2) in wbt_rqw_done()
226 wake_up_all(&rqw->wait); in wbt_rqw_done()
252 if (rwb->sync_cookie == rq) { in wbt_done()
253 rwb->sync_issue = 0; in wbt_done()
254 rwb->sync_cookie = NULL; in wbt_done()
257 wb_timestamp(rwb, &rwb->last_comp); in wbt_done()
260 WARN_ON_ONCE(rq == rwb->sync_cookie); in wbt_done()
280 u64 issue = READ_ONCE(rwb->sync_issue); in rwb_sync_issue_lat()
282 if (!issue || !rwb->sync_cookie) in rwb_sync_issue_lat()
285 return blk_time_get_ns() - issue; in rwb_sync_issue_lat()
293 ret += atomic_read(&rwb->rq_wait[i].inflight); in wbt_inflight()
307 struct backing_dev_info *bdi = rwb->rqos.disk->bdi; in latency_exceeded()
308 struct rq_depth *rqd = &rwb->rq_depth; in latency_exceeded()
321 if (thislat > rwb->cur_win_nsec || in latency_exceeded()
322 (thislat > rwb->min_lat_nsec && !stat[READ].nr_samples)) { in latency_exceeded()
344 * If the 'min' latency exceeds our target, step down. in latency_exceeded()
346 if (stat[READ].min > rwb->min_lat_nsec) { in latency_exceeded()
352 if (rqd->scale_step) in latency_exceeded()
360 struct backing_dev_info *bdi = rwb->rqos.disk->bdi; in rwb_trace_step()
361 struct rq_depth *rqd = &rwb->rq_depth; in rwb_trace_step()
363 trace_wbt_step(bdi, msg, rqd->scale_step, rwb->cur_win_nsec, in rwb_trace_step()
364 rwb->wb_background, rwb->wb_normal, rqd->max_depth); in rwb_trace_step()
369 if (rwb->min_lat_nsec == 0) { in calc_wb_limits()
370 rwb->wb_normal = rwb->wb_background = 0; in calc_wb_limits()
371 } else if (rwb->rq_depth.max_depth <= 2) { in calc_wb_limits()
372 rwb->wb_normal = rwb->rq_depth.max_depth; in calc_wb_limits()
373 rwb->wb_background = 1; in calc_wb_limits()
375 rwb->wb_normal = (rwb->rq_depth.max_depth + 1) / 2; in calc_wb_limits()
376 rwb->wb_background = (rwb->rq_depth.max_depth + 3) / 4; in calc_wb_limits()
382 if (!rq_depth_scale_up(&rwb->rq_depth)) in scale_up()
385 rwb->unknown_cnt = 0; in scale_up()
392 if (!rq_depth_scale_down(&rwb->rq_depth, hard_throttle)) in scale_down()
395 rwb->unknown_cnt = 0; in scale_down()
396 rwb_trace_step(rwb, tracepoint_string("scale down")); in scale_down()
401 struct rq_depth *rqd = &rwb->rq_depth; in rwb_arm_timer()
403 if (rqd->scale_step > 0) { in rwb_arm_timer()
410 rwb->cur_win_nsec = div_u64(rwb->win_nsec << 4, in rwb_arm_timer()
411 int_sqrt((rqd->scale_step + 1) << 8)); in rwb_arm_timer()
417 rwb->cur_win_nsec = rwb->win_nsec; in rwb_arm_timer()
420 blk_stat_activate_nsecs(rwb->cb, rwb->cur_win_nsec); in rwb_arm_timer()
425 struct rq_wb *rwb = cb->data; in wb_timer_fn()
426 struct rq_depth *rqd = &rwb->rq_depth; in wb_timer_fn()
430 if (!rwb->rqos.disk) in wb_timer_fn()
433 status = latency_exceeded(rwb, cb->stat); in wb_timer_fn()
435 trace_wbt_timer(rwb->rqos.disk->bdi, status, rqd->scale_step, inflight); in wb_timer_fn()
438 * If we exceeded the latency target, step down. If we did not, in wb_timer_fn()
458 if (++rwb->unknown_cnt < RWB_UNKNOWN_BUMP) in wb_timer_fn()
465 if (rqd->scale_step > 0) in wb_timer_fn()
467 else if (rqd->scale_step < 0) in wb_timer_fn()
475 * Re-arm timer, if we have IO in flight in wb_timer_fn()
477 if (rqd->scale_step || inflight) in wb_timer_fn()
483 struct rq_depth *rqd = &rwb->rq_depth; in wbt_update_limits()
485 rqd->scale_step = 0; in wbt_update_limits()
486 rqd->scaled_max = false; in wbt_update_limits()
506 return RQWB(rqos)->min_lat_nsec; in wbt_get_min_lat()
515 RQWB(rqos)->min_lat_nsec = val; in wbt_set_min_lat()
517 RQWB(rqos)->enable_state = WBT_STATE_ON_MANUAL; in wbt_set_min_lat()
519 RQWB(rqos)->enable_state = WBT_STATE_OFF_MANUAL; in wbt_set_min_lat()
529 return time_before(now, rwb->last_issue + HZ / 10) || in close_io()
530 time_before(now, rwb->last_comp + HZ / 10); in close_io()
540 return rwb->wb_background; in get_limit()
551 limit = rwb->rq_depth.max_depth; in get_limit()
557 limit = rwb->wb_background; in get_limit()
559 limit = rwb->wb_normal; in get_limit()
573 return rq_wait_inc_below(rqw, get_limit(data->rwb, data->opf)); in wbt_inflight_cb()
579 wbt_rqw_done(data->rwb, rqw, data->wb_acct); in wbt_cleanup_cb()
606 if ((bio->bi_opf & (REQ_SYNC | REQ_IDLE)) == in wbt_should_throttle()
627 if (bio->bi_opf & REQ_SWAP) in bio_to_wbt_flags()
652 wb_timestamp(rwb, &rwb->last_issue); in wbt_wait()
656 __wbt_wait(rwb, flags, bio->bi_opf); in wbt_wait()
658 if (!blk_stat_is_active(rwb->cb)) in wbt_wait()
665 rq->wbt_flags |= bio_to_wbt_flags(rwb, bio); in wbt_track()
682 if (wbt_is_read(rq) && !rwb->sync_issue) { in wbt_issue()
683 rwb->sync_cookie = rq; in wbt_issue()
684 rwb->sync_issue = rq->io_start_time_ns; in wbt_issue()
693 if (rq == rwb->sync_cookie) { in wbt_requeue()
694 rwb->sync_issue = 0; in wbt_requeue()
695 rwb->sync_cookie = NULL; in wbt_requeue()
704 struct request_queue *q = disk->queue; in wbt_enable_default()
708 mutex_lock(&disk->rqos_state_mutex); in wbt_enable_default()
716 if (enable && RQWB(rqos)->enable_state == WBT_STATE_OFF_DEFAULT) in wbt_enable_default()
717 RQWB(rqos)->enable_state = WBT_STATE_ON_DEFAULT; in wbt_enable_default()
718 mutex_unlock(&disk->rqos_state_mutex); in wbt_enable_default()
721 mutex_unlock(&disk->rqos_state_mutex); in wbt_enable_default()
723 /* Queue not registered? Maybe shutting down... */ in wbt_enable_default()
735 * We default to 2msec for non-rotational storage, and 75msec in wbt_default_latency_nsec()
754 return -1; in wbt_data_dir()
759 RQWB(rqos)->rq_depth.queue_depth = blk_queue_depth(rqos->disk->queue); in wbt_queue_depth_changed()
767 blk_stat_remove_callback(rqos->disk->queue, rwb->cb); in wbt_exit()
768 blk_stat_free_callback(rwb->cb); in wbt_exit()
777 struct rq_qos *rqos = wbt_rq_qos(disk->queue); in wbt_disable_default()
781 mutex_lock(&disk->rqos_state_mutex); in wbt_disable_default()
783 if (rwb->enable_state == WBT_STATE_ON_DEFAULT) { in wbt_disable_default()
784 blk_stat_deactivate(rwb->cb); in wbt_disable_default()
785 rwb->enable_state = WBT_STATE_OFF_DEFAULT; in wbt_disable_default()
787 mutex_unlock(&disk->rqos_state_mutex); in wbt_disable_default()
797 seq_printf(m, "%llu\n", rwb->cur_win_nsec); in wbt_curr_win_nsec_show()
806 seq_printf(m, "%d\n", rwb->enable_state); in wbt_enabled_show()
814 seq_printf(m, "%u\n", rqos->id); in wbt_id_show()
826 atomic_read(&rwb->rq_wait[i].inflight)); in wbt_inflight_show()
835 seq_printf(m, "%lu\n", rwb->min_lat_nsec); in wbt_min_lat_nsec_show()
844 seq_printf(m, "%u\n", rwb->unknown_cnt); in wbt_unknown_cnt_show()
853 seq_printf(m, "%u\n", rwb->wb_normal); in wbt_normal_show()
862 seq_printf(m, "%u\n", rwb->wb_background); in wbt_background_show()
895 struct request_queue *q = disk->queue; in wbt_init()
902 return -ENOMEM; in wbt_init()
904 rwb->cb = blk_stat_alloc_callback(wb_timer_fn, wbt_data_dir, 2, rwb); in wbt_init()
905 if (!rwb->cb) { in wbt_init()
907 return -ENOMEM; in wbt_init()
911 rq_wait_init(&rwb->rq_wait[i]); in wbt_init()
913 rwb->last_comp = rwb->last_issue = jiffies; in wbt_init()
914 rwb->win_nsec = RWB_WINDOW_NSEC; in wbt_init()
915 rwb->enable_state = WBT_STATE_ON_DEFAULT; in wbt_init()
916 rwb->rq_depth.default_depth = RWB_DEF_DEPTH; in wbt_init()
917 rwb->min_lat_nsec = wbt_default_latency_nsec(q); in wbt_init()
918 rwb->rq_depth.queue_depth = blk_queue_depth(q); in wbt_init()
924 mutex_lock(&q->rq_qos_mutex); in wbt_init()
925 ret = rq_qos_add(&rwb->rqos, disk, RQ_QOS_WBT, &wbt_rqos_ops); in wbt_init()
926 mutex_unlock(&q->rq_qos_mutex); in wbt_init()
930 blk_stat_add_callback(q, rwb->cb); in wbt_init()
935 blk_stat_free_callback(rwb->cb); in wbt_init()