blob: 2944c129760ce56f060962132006aba1b0a4ed5e [file] [log] [blame]
Christoph Hellwig3dcf60b2019-04-30 14:42:43 -04001// SPDX-License-Identifier: GPL-2.0
Linus Torvalds1da177e2005-04-16 15:20:36 -07002/*
Linus Torvalds1da177e2005-04-16 15:20:36 -07003 * Block device elevator/IO-scheduler.
4 *
5 * Copyright (C) 2000 Andrea Arcangeli <andrea@suse.de> SuSE
6 *
Jens Axboe0fe23472006-09-04 15:41:16 +02007 * 30042000 Jens Axboe <axboe@kernel.dk> :
Linus Torvalds1da177e2005-04-16 15:20:36 -07008 *
9 * Split the elevator a bit so that it is possible to choose a different
10 * one or even write a new "plug in". There are three pieces:
11 * - elevator_fn, inserts a new request in the queue list
12 * - elevator_merge_fn, decides whether a new buffer can be merged with
13 * an existing request
14 * - elevator_dequeue_fn, called when a request is taken off the active list
15 *
16 * 20082000 Dave Jones <davej@suse.de> :
17 * Removed tests for max-bomb-segments, which was breaking elvtune
18 * when run without -bN
19 *
20 * Jens:
21 * - Rework again to work with bio instead of buffer_heads
22 * - loose bi_dev comparisons, partition handling is right now
23 * - completely modularize elevator setup and teardown
24 *
25 */
26#include <linux/kernel.h>
27#include <linux/fs.h>
28#include <linux/blkdev.h>
29#include <linux/elevator.h>
30#include <linux/bio.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070031#include <linux/module.h>
32#include <linux/slab.h>
33#include <linux/init.h>
34#include <linux/compiler.h>
Jens Axboe2056a782006-03-23 20:00:26 +010035#include <linux/blktrace_api.h>
Jens Axboe98170642006-07-28 09:23:08 +020036#include <linux/hash.h>
Jens Axboe0835da62008-08-26 09:15:47 +020037#include <linux/uaccess.h>
Lin Mingc8158812013-03-23 11:42:27 +080038#include <linux/pm_runtime.h>
Tejun Heoeea8f412015-05-22 17:13:17 -040039#include <linux/blk-cgroup.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070040
Li Zefan55782132009-06-09 13:43:05 +080041#include <trace/events/block.h>
42
Jens Axboe242f9dc2008-09-14 05:55:09 -070043#include "blk.h"
Jens Axboebd166ef2017-01-17 06:03:22 -070044#include "blk-mq-sched.h"
Bart Van Asschebca6b062018-09-26 14:01:03 -070045#include "blk-pm.h"
Jan Kara8330cdb2017-04-19 11:33:27 +020046#include "blk-wbt.h"
Jens Axboe242f9dc2008-09-14 05:55:09 -070047
/*
 * elv_list holds every registered elevator type; it is walked and modified
 * with elv_list_lock held.
 */
static DEFINE_SPINLOCK(elv_list_lock);
static LIST_HEAD(elv_list);
50
/*
 * Merge hash key of a request: its start position plus its length in
 * sectors.  elv_merge() looks up a bio's start sector under this key to
 * find a back merge candidate.
 */
#define rq_hash_key(rq)		(blk_rq_pos(rq) + blk_rq_sectors(rq))
Jens Axboe98170642006-07-28 09:23:08 +020055
56/*
Jens Axboeda775262006-12-20 11:04:12 +010057 * Query io scheduler to see if the current process issuing bio may be
58 * merged with rq.
59 */
Tahsin Erdogan72ef7992016-07-07 11:48:22 -070060static int elv_iosched_allow_bio_merge(struct request *rq, struct bio *bio)
Jens Axboeda775262006-12-20 11:04:12 +010061{
Jens Axboe165125e2007-07-24 09:28:11 +020062 struct request_queue *q = rq->q;
Jens Axboeb374d182008-10-31 10:05:07 +010063 struct elevator_queue *e = q->elevator;
Jens Axboeda775262006-12-20 11:04:12 +010064
Jens Axboef9cd4bf2018-11-01 16:41:41 -060065 if (e->type->ops.allow_merge)
66 return e->type->ops.allow_merge(q, rq, bio);
Jens Axboeda775262006-12-20 11:04:12 +010067
68 return 1;
69}
70
71/*
Linus Torvalds1da177e2005-04-16 15:20:36 -070072 * can we safely merge with this request?
73 */
Tahsin Erdogan72ef7992016-07-07 11:48:22 -070074bool elv_bio_merge_ok(struct request *rq, struct bio *bio)
Linus Torvalds1da177e2005-04-16 15:20:36 -070075{
Tejun Heo050c8ea2012-02-08 09:19:38 +010076 if (!blk_rq_merge_ok(rq, bio))
Tahsin Erdogan72ef7992016-07-07 11:48:22 -070077 return false;
Martin K. Petersen7ba1ba12008-06-30 20:04:41 +020078
Tahsin Erdogan72ef7992016-07-07 11:48:22 -070079 if (!elv_iosched_allow_bio_merge(rq, bio))
80 return false;
Jens Axboeda775262006-12-20 11:04:12 +010081
Tahsin Erdogan72ef7992016-07-07 11:48:22 -070082 return true;
Linus Torvalds1da177e2005-04-16 15:20:36 -070083}
Tahsin Erdogan72ef7992016-07-07 11:48:22 -070084EXPORT_SYMBOL(elv_bio_merge_ok);
Linus Torvalds1da177e2005-04-16 15:20:36 -070085
Jens Axboe8ac0d9a2017-10-25 12:35:02 -060086static bool elevator_match(const struct elevator_type *e, const char *name)
87{
88 if (!strcmp(e->elevator_name, name))
89 return true;
90 if (e->elevator_alias && !strcmp(e->elevator_alias, name))
91 return true;
92
93 return false;
94}
95
Jens Axboe2527d992017-10-25 12:33:42 -060096/*
Jens Axboea1ce35f2018-10-29 10:23:51 -060097 * Return scheduler with name 'name'
Jens Axboe2527d992017-10-25 12:33:42 -060098 */
Jens Axboea1ce35f2018-10-29 10:23:51 -060099static struct elevator_type *elevator_find(const char *name)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700100{
Vasily Tarasova22b1692006-10-11 09:24:27 +0200101 struct elevator_type *e;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700102
Matthias Kaehlcke70cee262007-07-10 12:26:24 +0200103 list_for_each_entry(e, &elv_list, list) {
Jens Axboea1ce35f2018-10-29 10:23:51 -0600104 if (elevator_match(e, name))
Vasily Tarasova22b1692006-10-11 09:24:27 +0200105 return e;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700106 }
Linus Torvalds1da177e2005-04-16 15:20:36 -0700107
Vasily Tarasova22b1692006-10-11 09:24:27 +0200108 return NULL;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700109}
110
111static void elevator_put(struct elevator_type *e)
112{
113 module_put(e->elevator_owner);
114}
115
Jens Axboe2527d992017-10-25 12:33:42 -0600116static struct elevator_type *elevator_get(struct request_queue *q,
117 const char *name, bool try_loading)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700118{
Tejun Heo2824bc932005-10-20 10:56:41 +0200119 struct elevator_type *e;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700120
Jens Axboe2a12dcd2007-04-26 14:41:53 +0200121 spin_lock(&elv_list_lock);
Tejun Heo2824bc932005-10-20 10:56:41 +0200122
Jens Axboea1ce35f2018-10-29 10:23:51 -0600123 e = elevator_find(name);
Tejun Heo21c3c5d2013-01-22 16:48:03 -0800124 if (!e && try_loading) {
Jens Axboee1640942008-02-19 10:20:37 +0100125 spin_unlock(&elv_list_lock);
Kees Cook490b94b2011-05-05 18:02:12 -0600126 request_module("%s-iosched", name);
Jens Axboee1640942008-02-19 10:20:37 +0100127 spin_lock(&elv_list_lock);
Jens Axboea1ce35f2018-10-29 10:23:51 -0600128 e = elevator_find(name);
Jens Axboee1640942008-02-19 10:20:37 +0100129 }
130
Tejun Heo2824bc932005-10-20 10:56:41 +0200131 if (e && !try_module_get(e->elevator_owner))
132 e = NULL;
133
Jens Axboe2a12dcd2007-04-26 14:41:53 +0200134 spin_unlock(&elv_list_lock);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700135 return e;
136}
137
Al Viro3d1ab402006-03-18 18:35:43 -0500138static struct kobj_type elv_ktype;
139
Jianpeng Mad50235b2013-07-03 13:25:24 +0200140struct elevator_queue *elevator_alloc(struct request_queue *q,
Jens Axboe165125e2007-07-24 09:28:11 +0200141 struct elevator_type *e)
Al Viro3d1ab402006-03-18 18:35:43 -0500142{
Jens Axboeb374d182008-10-31 10:05:07 +0100143 struct elevator_queue *eq;
Jens Axboe98170642006-07-28 09:23:08 +0200144
Joe Perchesc1b511e2013-08-29 15:21:42 -0700145 eq = kzalloc_node(sizeof(*eq), GFP_KERNEL, q->node);
Jens Axboe98170642006-07-28 09:23:08 +0200146 if (unlikely(!eq))
Chao Yu8406a4d2015-04-23 10:47:44 -0600147 return NULL;
Jens Axboe98170642006-07-28 09:23:08 +0200148
Tejun Heo22f746e2011-12-14 00:33:41 +0100149 eq->type = e;
Greg Kroah-Hartmanf9cb0742007-12-17 23:05:35 -0700150 kobject_init(&eq->kobj, &elv_ktype);
Jens Axboe98170642006-07-28 09:23:08 +0200151 mutex_init(&eq->sysfs_lock);
Sasha Levin242d98f2012-12-17 10:01:27 -0500152 hash_init(eq->hash);
Jens Axboe98170642006-07-28 09:23:08 +0200153
Al Viro3d1ab402006-03-18 18:35:43 -0500154 return eq;
155}
Jianpeng Mad50235b2013-07-03 13:25:24 +0200156EXPORT_SYMBOL(elevator_alloc);
Al Viro3d1ab402006-03-18 18:35:43 -0500157
158static void elevator_release(struct kobject *kobj)
159{
Jens Axboeb374d182008-10-31 10:05:07 +0100160 struct elevator_queue *e;
Jens Axboe98170642006-07-28 09:23:08 +0200161
Jens Axboeb374d182008-10-31 10:05:07 +0100162 e = container_of(kobj, struct elevator_queue, kobj);
Tejun Heo22f746e2011-12-14 00:33:41 +0100163 elevator_put(e->type);
Al Viro3d1ab402006-03-18 18:35:43 -0500164 kfree(e);
165}
166
Ming Leic3e22192019-06-04 21:08:02 +0800167void __elevator_exit(struct request_queue *q, struct elevator_queue *e)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700168{
Al Viro3d1ab402006-03-18 18:35:43 -0500169 mutex_lock(&e->sysfs_lock);
Jens Axboef9cd4bf2018-11-01 16:41:41 -0600170 if (e->type->ops.exit_sched)
Omar Sandoval54d53292017-04-07 08:52:27 -0600171 blk_mq_exit_sched(q, e);
Al Viro3d1ab402006-03-18 18:35:43 -0500172 mutex_unlock(&e->sysfs_lock);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700173
Al Viro3d1ab402006-03-18 18:35:43 -0500174 kobject_put(&e->kobj);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700175}
Jens Axboe2e662b62006-07-13 11:55:04 +0200176
Jens Axboe98170642006-07-28 09:23:08 +0200177static inline void __elv_rqhash_del(struct request *rq)
178{
Sasha Levin242d98f2012-12-17 10:01:27 -0500179 hash_del(&rq->hash);
Christoph Hellwige8064022016-10-20 15:12:13 +0200180 rq->rq_flags &= ~RQF_HASHED;
Jens Axboe98170642006-07-28 09:23:08 +0200181}
182
/* Remove @rq from the merge hash if it is currently on it. */
void elv_rqhash_del(struct request_queue *q, struct request *rq)
{
	if (!ELV_ON_HASH(rq))
		return;

	__elv_rqhash_del(rq);
}
EXPORT_SYMBOL_GPL(elv_rqhash_del);
Jens Axboe98170642006-07-28 09:23:08 +0200189
Jens Axboe70b3ea02016-12-07 08:43:31 -0700190void elv_rqhash_add(struct request_queue *q, struct request *rq)
Jens Axboe98170642006-07-28 09:23:08 +0200191{
Jens Axboeb374d182008-10-31 10:05:07 +0100192 struct elevator_queue *e = q->elevator;
Jens Axboe98170642006-07-28 09:23:08 +0200193
194 BUG_ON(ELV_ON_HASH(rq));
Sasha Levin242d98f2012-12-17 10:01:27 -0500195 hash_add(e->hash, &rq->hash, rq_hash_key(rq));
Christoph Hellwige8064022016-10-20 15:12:13 +0200196 rq->rq_flags |= RQF_HASHED;
Jens Axboe98170642006-07-28 09:23:08 +0200197}
Jens Axboebd166ef2017-01-17 06:03:22 -0700198EXPORT_SYMBOL_GPL(elv_rqhash_add);
Jens Axboe98170642006-07-28 09:23:08 +0200199
/*
 * Re-hash @rq: unhash it unconditionally, then add it back so that it is
 * filed under its current rq_hash_key().
 */
void elv_rqhash_reposition(struct request_queue *q, struct request *rq)
{
	__elv_rqhash_del(rq);
	elv_rqhash_add(q, rq);
}
205
Jens Axboe70b3ea02016-12-07 08:43:31 -0700206struct request *elv_rqhash_find(struct request_queue *q, sector_t offset)
Jens Axboe98170642006-07-28 09:23:08 +0200207{
Jens Axboeb374d182008-10-31 10:05:07 +0100208 struct elevator_queue *e = q->elevator;
Sasha Levinb67bfe02013-02-27 17:06:00 -0800209 struct hlist_node *next;
Jens Axboe98170642006-07-28 09:23:08 +0200210 struct request *rq;
211
Linus Torvaldsee89f812013-02-28 12:52:24 -0800212 hash_for_each_possible_safe(e->hash, rq, next, hash, offset) {
Jens Axboe98170642006-07-28 09:23:08 +0200213 BUG_ON(!ELV_ON_HASH(rq));
214
215 if (unlikely(!rq_mergeable(rq))) {
216 __elv_rqhash_del(rq);
217 continue;
218 }
219
220 if (rq_hash_key(rq) == offset)
221 return rq;
222 }
223
224 return NULL;
225}
226
Tejun Heo8922e162005-10-20 16:23:44 +0200227/*
Jens Axboe2e662b62006-07-13 11:55:04 +0200228 * RB-tree support functions for inserting/lookup/removal of requests
229 * in a sorted RB tree.
230 */
Jeff Moyer796d5112011-06-02 21:19:05 +0200231void elv_rb_add(struct rb_root *root, struct request *rq)
Jens Axboe2e662b62006-07-13 11:55:04 +0200232{
233 struct rb_node **p = &root->rb_node;
234 struct rb_node *parent = NULL;
235 struct request *__rq;
236
237 while (*p) {
238 parent = *p;
239 __rq = rb_entry(parent, struct request, rb_node);
240
Tejun Heo83096eb2009-05-07 22:24:39 +0900241 if (blk_rq_pos(rq) < blk_rq_pos(__rq))
Jens Axboe2e662b62006-07-13 11:55:04 +0200242 p = &(*p)->rb_left;
Jeff Moyer796d5112011-06-02 21:19:05 +0200243 else if (blk_rq_pos(rq) >= blk_rq_pos(__rq))
Jens Axboe2e662b62006-07-13 11:55:04 +0200244 p = &(*p)->rb_right;
Jens Axboe2e662b62006-07-13 11:55:04 +0200245 }
246
247 rb_link_node(&rq->rb_node, parent, p);
248 rb_insert_color(&rq->rb_node, root);
Jens Axboe2e662b62006-07-13 11:55:04 +0200249}
Jens Axboe2e662b62006-07-13 11:55:04 +0200250EXPORT_SYMBOL(elv_rb_add);
251
252void elv_rb_del(struct rb_root *root, struct request *rq)
253{
254 BUG_ON(RB_EMPTY_NODE(&rq->rb_node));
255 rb_erase(&rq->rb_node, root);
256 RB_CLEAR_NODE(&rq->rb_node);
257}
Jens Axboe2e662b62006-07-13 11:55:04 +0200258EXPORT_SYMBOL(elv_rb_del);
259
260struct request *elv_rb_find(struct rb_root *root, sector_t sector)
261{
262 struct rb_node *n = root->rb_node;
263 struct request *rq;
264
265 while (n) {
266 rq = rb_entry(n, struct request, rb_node);
267
Tejun Heo83096eb2009-05-07 22:24:39 +0900268 if (sector < blk_rq_pos(rq))
Jens Axboe2e662b62006-07-13 11:55:04 +0200269 n = n->rb_left;
Tejun Heo83096eb2009-05-07 22:24:39 +0900270 else if (sector > blk_rq_pos(rq))
Jens Axboe2e662b62006-07-13 11:55:04 +0200271 n = n->rb_right;
272 else
273 return rq;
274 }
275
276 return NULL;
277}
Jens Axboe2e662b62006-07-13 11:55:04 +0200278EXPORT_SYMBOL(elv_rb_find);
279
Christoph Hellwig34fe7c02017-02-08 14:46:48 +0100280enum elv_merge elv_merge(struct request_queue *q, struct request **req,
281 struct bio *bio)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700282{
Jens Axboeb374d182008-10-31 10:05:07 +0100283 struct elevator_queue *e = q->elevator;
Jens Axboe98170642006-07-28 09:23:08 +0200284 struct request *__rq;
Tejun Heo06b86242005-10-20 16:46:23 +0200285
Jens Axboe98170642006-07-28 09:23:08 +0200286 /*
Alan D. Brunelle488991e2010-01-29 09:04:08 +0100287 * Levels of merges:
288 * nomerges: No merges at all attempted
289 * noxmerges: Only simple one-hit cache try
290 * merges: All merge tries attempted
291 */
Ming Lei7460d382015-10-20 23:13:55 +0800292 if (blk_queue_nomerges(q) || !bio_mergeable(bio))
Alan D. Brunelle488991e2010-01-29 09:04:08 +0100293 return ELEVATOR_NO_MERGE;
294
295 /*
Jens Axboe98170642006-07-28 09:23:08 +0200296 * First try one-hit cache.
297 */
Tahsin Erdogan72ef7992016-07-07 11:48:22 -0700298 if (q->last_merge && elv_bio_merge_ok(q->last_merge, bio)) {
Christoph Hellwig34fe7c02017-02-08 14:46:48 +0100299 enum elv_merge ret = blk_try_merge(q->last_merge, bio);
300
Tejun Heo06b86242005-10-20 16:46:23 +0200301 if (ret != ELEVATOR_NO_MERGE) {
302 *req = q->last_merge;
303 return ret;
304 }
305 }
Linus Torvalds1da177e2005-04-16 15:20:36 -0700306
Alan D. Brunelle488991e2010-01-29 09:04:08 +0100307 if (blk_queue_noxmerges(q))
Alan D. Brunelleac9fafa2008-04-29 14:44:19 +0200308 return ELEVATOR_NO_MERGE;
309
Jens Axboe98170642006-07-28 09:23:08 +0200310 /*
311 * See if our hash lookup can find a potential backmerge.
312 */
Kent Overstreet4f024f32013-10-11 15:44:27 -0700313 __rq = elv_rqhash_find(q, bio->bi_iter.bi_sector);
Tahsin Erdogan72ef7992016-07-07 11:48:22 -0700314 if (__rq && elv_bio_merge_ok(__rq, bio)) {
Jens Axboe98170642006-07-28 09:23:08 +0200315 *req = __rq;
316 return ELEVATOR_BACK_MERGE;
317 }
318
Jens Axboef9cd4bf2018-11-01 16:41:41 -0600319 if (e->type->ops.request_merge)
320 return e->type->ops.request_merge(q, req, bio);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700321
322 return ELEVATOR_NO_MERGE;
323}
324
Jens Axboe5e84ea32011-03-21 10:14:27 +0100325/*
326 * Attempt to do an insertion back merge. Only check for the case where
327 * we can append 'rq' to an existing request, so we can throw 'rq' away
328 * afterwards.
329 *
330 * Returns true if we merged, false otherwise
331 */
Jens Axboebd166ef2017-01-17 06:03:22 -0700332bool elv_attempt_insert_merge(struct request_queue *q, struct request *rq)
Jens Axboe5e84ea32011-03-21 10:14:27 +0100333{
334 struct request *__rq;
Shaohua Libee03932012-11-09 08:44:27 +0100335 bool ret;
Jens Axboe5e84ea32011-03-21 10:14:27 +0100336
337 if (blk_queue_nomerges(q))
338 return false;
339
340 /*
341 * First try one-hit cache.
342 */
343 if (q->last_merge && blk_attempt_req_merge(q, q->last_merge, rq))
344 return true;
345
346 if (blk_queue_noxmerges(q))
347 return false;
348
Shaohua Libee03932012-11-09 08:44:27 +0100349 ret = false;
Jens Axboe5e84ea32011-03-21 10:14:27 +0100350 /*
351 * See if our hash lookup can find a potential backmerge.
352 */
Shaohua Libee03932012-11-09 08:44:27 +0100353 while (1) {
354 __rq = elv_rqhash_find(q, blk_rq_pos(rq));
355 if (!__rq || !blk_attempt_req_merge(q, __rq, rq))
356 break;
Jens Axboe5e84ea32011-03-21 10:14:27 +0100357
Shaohua Libee03932012-11-09 08:44:27 +0100358 /* The merged request could be merged with others, try again */
359 ret = true;
360 rq = __rq;
361 }
362
363 return ret;
Jens Axboe5e84ea32011-03-21 10:14:27 +0100364}
365
Christoph Hellwig34fe7c02017-02-08 14:46:48 +0100366void elv_merged_request(struct request_queue *q, struct request *rq,
367 enum elv_merge type)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700368{
Jens Axboeb374d182008-10-31 10:05:07 +0100369 struct elevator_queue *e = q->elevator;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700370
Jens Axboef9cd4bf2018-11-01 16:41:41 -0600371 if (e->type->ops.request_merged)
372 e->type->ops.request_merged(q, rq, type);
Tejun Heo06b86242005-10-20 16:46:23 +0200373
Jens Axboe2e662b62006-07-13 11:55:04 +0200374 if (type == ELEVATOR_BACK_MERGE)
375 elv_rqhash_reposition(q, rq);
Jens Axboe98170642006-07-28 09:23:08 +0200376
Tejun Heo06b86242005-10-20 16:46:23 +0200377 q->last_merge = rq;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700378}
379
Jens Axboe165125e2007-07-24 09:28:11 +0200380void elv_merge_requests(struct request_queue *q, struct request *rq,
Linus Torvalds1da177e2005-04-16 15:20:36 -0700381 struct request *next)
382{
Jens Axboeb374d182008-10-31 10:05:07 +0100383 struct elevator_queue *e = q->elevator;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700384
Jens Axboef9cd4bf2018-11-01 16:41:41 -0600385 if (e->type->ops.requests_merged)
386 e->type->ops.requests_merged(q, rq, next);
Tejun Heo06b86242005-10-20 16:46:23 +0200387
Jens Axboe98170642006-07-28 09:23:08 +0200388 elv_rqhash_reposition(q, rq);
Tejun Heo06b86242005-10-20 16:46:23 +0200389 q->last_merge = rq;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700390}
391
Jens Axboe165125e2007-07-24 09:28:11 +0200392struct request *elv_latter_request(struct request_queue *q, struct request *rq)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700393{
Jens Axboeb374d182008-10-31 10:05:07 +0100394 struct elevator_queue *e = q->elevator;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700395
Jens Axboef9cd4bf2018-11-01 16:41:41 -0600396 if (e->type->ops.next_request)
397 return e->type->ops.next_request(q, rq);
Jens Axboebd166ef2017-01-17 06:03:22 -0700398
Linus Torvalds1da177e2005-04-16 15:20:36 -0700399 return NULL;
400}
401
Jens Axboe165125e2007-07-24 09:28:11 +0200402struct request *elv_former_request(struct request_queue *q, struct request *rq)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700403{
Jens Axboeb374d182008-10-31 10:05:07 +0100404 struct elevator_queue *e = q->elevator;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700405
Jens Axboef9cd4bf2018-11-01 16:41:41 -0600406 if (e->type->ops.former_request)
407 return e->type->ops.former_request(q, rq);
Jens Axboea1ce35f2018-10-29 10:23:51 -0600408
Linus Torvalds1da177e2005-04-16 15:20:36 -0700409 return NULL;
410}
411
/* Map a struct attribute pointer back to the elv_fs_entry embedding it. */
#define to_elv(atr)	container_of((atr), struct elv_fs_entry, attr)
413
414static ssize_t
415elv_attr_show(struct kobject *kobj, struct attribute *attr, char *page)
416{
Al Viro3d1ab402006-03-18 18:35:43 -0500417 struct elv_fs_entry *entry = to_elv(attr);
Jens Axboeb374d182008-10-31 10:05:07 +0100418 struct elevator_queue *e;
Al Viro3d1ab402006-03-18 18:35:43 -0500419 ssize_t error;
420
421 if (!entry->show)
422 return -EIO;
423
Jens Axboeb374d182008-10-31 10:05:07 +0100424 e = container_of(kobj, struct elevator_queue, kobj);
Al Viro3d1ab402006-03-18 18:35:43 -0500425 mutex_lock(&e->sysfs_lock);
Tejun Heo22f746e2011-12-14 00:33:41 +0100426 error = e->type ? entry->show(e, page) : -ENOENT;
Al Viro3d1ab402006-03-18 18:35:43 -0500427 mutex_unlock(&e->sysfs_lock);
428 return error;
429}
430
431static ssize_t
432elv_attr_store(struct kobject *kobj, struct attribute *attr,
433 const char *page, size_t length)
434{
Al Viro3d1ab402006-03-18 18:35:43 -0500435 struct elv_fs_entry *entry = to_elv(attr);
Jens Axboeb374d182008-10-31 10:05:07 +0100436 struct elevator_queue *e;
Al Viro3d1ab402006-03-18 18:35:43 -0500437 ssize_t error;
438
439 if (!entry->store)
440 return -EIO;
441
Jens Axboeb374d182008-10-31 10:05:07 +0100442 e = container_of(kobj, struct elevator_queue, kobj);
Al Viro3d1ab402006-03-18 18:35:43 -0500443 mutex_lock(&e->sysfs_lock);
Tejun Heo22f746e2011-12-14 00:33:41 +0100444 error = e->type ? entry->store(e, page, length) : -ENOENT;
Al Viro3d1ab402006-03-18 18:35:43 -0500445 mutex_unlock(&e->sysfs_lock);
446 return error;
447}
448
Emese Revfy52cf25d2010-01-19 02:58:23 +0100449static const struct sysfs_ops elv_sysfs_ops = {
Al Viro3d1ab402006-03-18 18:35:43 -0500450 .show = elv_attr_show,
451 .store = elv_attr_store,
452};
453
454static struct kobj_type elv_ktype = {
455 .sysfs_ops = &elv_sysfs_ops,
456 .release = elevator_release,
457};
458
Ming Leicecf5d82019-08-27 19:01:48 +0800459/*
460 * elv_register_queue is called from either blk_register_queue or
461 * elevator_switch, elevator switch is prevented from being happen
462 * in the two paths, so it is safe to not hold q->sysfs_lock.
463 */
464int elv_register_queue(struct request_queue *q, bool uevent)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700465{
Tejun Heo5a5bafd2012-03-05 13:14:56 -0800466 struct elevator_queue *e = q->elevator;
Al Viro3d1ab402006-03-18 18:35:43 -0500467 int error;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700468
Greg Kroah-Hartmanb2d6db52007-12-17 23:05:35 -0700469 error = kobject_add(&e->kobj, &q->kobj, "%s", "iosched");
Al Viro3d1ab402006-03-18 18:35:43 -0500470 if (!error) {
Tejun Heo22f746e2011-12-14 00:33:41 +0100471 struct elv_fs_entry *attr = e->type->elevator_attrs;
Al Viro3d1ab402006-03-18 18:35:43 -0500472 if (attr) {
Al Viroe572ec72006-03-18 22:27:18 -0500473 while (attr->attr.name) {
474 if (sysfs_create_file(&e->kobj, &attr->attr))
Al Viro3d1ab402006-03-18 18:35:43 -0500475 break;
Al Viroe572ec72006-03-18 22:27:18 -0500476 attr++;
Al Viro3d1ab402006-03-18 18:35:43 -0500477 }
478 }
Ming Leicecf5d82019-08-27 19:01:48 +0800479 if (uevent)
480 kobject_uevent(&e->kobj, KOBJ_ADD);
481
482 mutex_lock(&q->sysfs_lock);
Jens Axboe430c62f2010-10-07 09:35:16 +0200483 e->registered = 1;
Ming Leicecf5d82019-08-27 19:01:48 +0800484 mutex_unlock(&q->sysfs_lock);
Al Viro3d1ab402006-03-18 18:35:43 -0500485 }
486 return error;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700487}
Jens Axboebc1c1162006-06-08 08:49:06 +0200488
Ming Leicecf5d82019-08-27 19:01:48 +0800489/*
490 * elv_unregister_queue is called from either blk_unregister_queue or
491 * elevator_switch, elevator switch is prevented from being happen
492 * in the two paths, so it is safe to not hold q->sysfs_lock.
493 */
Linus Torvalds1da177e2005-04-16 15:20:36 -0700494void elv_unregister_queue(struct request_queue *q)
495{
Tejun Heof8fc8772011-12-14 00:33:40 +0100496 if (q) {
497 struct elevator_queue *e = q->elevator;
498
499 kobject_uevent(&e->kobj, KOBJ_REMOVE);
500 kobject_del(&e->kobj);
Ming Leicecf5d82019-08-27 19:01:48 +0800501
502 mutex_lock(&q->sysfs_lock);
Tejun Heof8fc8772011-12-14 00:33:40 +0100503 e->registered = 0;
Jan Kara8330cdb2017-04-19 11:33:27 +0200504 /* Re-enable throttling in case elevator disabled it */
505 wbt_enable_default(q);
Ming Leicecf5d82019-08-27 19:01:48 +0800506 mutex_unlock(&q->sysfs_lock);
Tejun Heof8fc8772011-12-14 00:33:40 +0100507 }
Linus Torvalds1da177e2005-04-16 15:20:36 -0700508}
509
Jens Axboee567bf72014-06-22 16:32:48 -0600510int elv_register(struct elevator_type *e)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700511{
Tejun Heo3d3c2372011-12-14 00:33:42 +0100512 /* create icq_cache if requested */
513 if (e->icq_size) {
514 if (WARN_ON(e->icq_size < sizeof(struct io_cq)) ||
515 WARN_ON(e->icq_align < __alignof__(struct io_cq)))
516 return -EINVAL;
517
518 snprintf(e->icq_cache_name, sizeof(e->icq_cache_name),
519 "%s_io_cq", e->elevator_name);
520 e->icq_cache = kmem_cache_create(e->icq_cache_name, e->icq_size,
521 e->icq_align, 0, NULL);
522 if (!e->icq_cache)
523 return -ENOMEM;
524 }
525
526 /* register, don't allow duplicate names */
Jens Axboe2a12dcd2007-04-26 14:41:53 +0200527 spin_lock(&elv_list_lock);
Jens Axboea1ce35f2018-10-29 10:23:51 -0600528 if (elevator_find(e->elevator_name)) {
Tejun Heo3d3c2372011-12-14 00:33:42 +0100529 spin_unlock(&elv_list_lock);
Chengguang Xu62d2a192018-08-28 07:31:11 +0800530 kmem_cache_destroy(e->icq_cache);
Tejun Heo3d3c2372011-12-14 00:33:42 +0100531 return -EBUSY;
532 }
Linus Torvalds1da177e2005-04-16 15:20:36 -0700533 list_add_tail(&e->list, &elv_list);
Jens Axboe2a12dcd2007-04-26 14:41:53 +0200534 spin_unlock(&elv_list_lock);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700535
Hisao Tanabed0b0a812019-04-08 00:27:42 +0900536 printk(KERN_INFO "io scheduler %s registered\n", e->elevator_name);
537
Tejun Heo3d3c2372011-12-14 00:33:42 +0100538 return 0;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700539}
540EXPORT_SYMBOL_GPL(elv_register);
541
542void elv_unregister(struct elevator_type *e)
543{
Tejun Heo3d3c2372011-12-14 00:33:42 +0100544 /* unregister */
Jens Axboe2a12dcd2007-04-26 14:41:53 +0200545 spin_lock(&elv_list_lock);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700546 list_del_init(&e->list);
Jens Axboe2a12dcd2007-04-26 14:41:53 +0200547 spin_unlock(&elv_list_lock);
Tejun Heo3d3c2372011-12-14 00:33:42 +0100548
549 /*
550 * Destroy icq_cache if it exists. icq's are RCU managed. Make
551 * sure all RCU operations are complete before proceeding.
552 */
553 if (e->icq_cache) {
554 rcu_barrier();
555 kmem_cache_destroy(e->icq_cache);
556 e->icq_cache = NULL;
557 }
Linus Torvalds1da177e2005-04-16 15:20:36 -0700558}
559EXPORT_SYMBOL_GPL(elv_unregister);
560
Jianchao Wangd48ece22018-08-21 15:15:03 +0800561int elevator_switch_mq(struct request_queue *q,
Omar Sandoval54d53292017-04-07 08:52:27 -0600562 struct elevator_type *new_e)
563{
564 int ret;
565
Bart Van Assche14a23492018-01-17 11:48:09 -0800566 lockdep_assert_held(&q->sysfs_lock);
567
Omar Sandoval54d53292017-04-07 08:52:27 -0600568 if (q->elevator) {
Ming Leicecf5d82019-08-27 19:01:48 +0800569 if (q->elevator->registered) {
570 mutex_unlock(&q->sysfs_lock);
571
572 /*
573 * Concurrent elevator switch can't happen becasue
574 * sysfs write is always exclusively on same file.
575 *
576 * Also the elevator queue won't be freed after
577 * sysfs_lock is released becasue kobject_del() in
578 * blk_unregister_queue() waits for completion of
579 * .store & .show on its attributes.
580 */
Omar Sandoval54d53292017-04-07 08:52:27 -0600581 elv_unregister_queue(q);
Ming Leicecf5d82019-08-27 19:01:48 +0800582
583 mutex_lock(&q->sysfs_lock);
584 }
Omar Sandoval54d53292017-04-07 08:52:27 -0600585 ioc_clear_queue(q);
586 elevator_exit(q, q->elevator);
Ming Leicecf5d82019-08-27 19:01:48 +0800587
588 /*
589 * sysfs_lock may be dropped, so re-check if queue is
590 * unregistered. If yes, don't switch to new elevator
591 * any more
592 */
593 if (!blk_queue_registered(q))
594 return 0;
Omar Sandoval54d53292017-04-07 08:52:27 -0600595 }
596
597 ret = blk_mq_init_sched(q, new_e);
598 if (ret)
599 goto out;
600
601 if (new_e) {
Ming Leicecf5d82019-08-27 19:01:48 +0800602 mutex_unlock(&q->sysfs_lock);
603
604 ret = elv_register_queue(q, true);
605
606 mutex_lock(&q->sysfs_lock);
Omar Sandoval54d53292017-04-07 08:52:27 -0600607 if (ret) {
608 elevator_exit(q, q->elevator);
609 goto out;
610 }
611 }
612
613 if (new_e)
614 blk_add_trace_msg(q, "elv switch: %s", new_e->elevator_name);
615 else
616 blk_add_trace_msg(q, "elv switch: none");
617
618out:
Omar Sandoval54d53292017-04-07 08:52:27 -0600619 return ret;
Omar Sandoval54d53292017-04-07 08:52:27 -0600620}
621
Damien Le Moal61db4372019-09-05 18:51:29 +0900622static inline bool elv_support_iosched(struct request_queue *q)
623{
624 if (q->tag_set && (q->tag_set->flags & BLK_MQ_F_NO_SCHED))
625 return false;
626 return true;
627}
628
Linus Torvalds1da177e2005-04-16 15:20:36 -0700629/*
Damien Le Moal61db4372019-09-05 18:51:29 +0900630 * For blk-mq devices supporting IO scheduling, we default to using mq-deadline,
Damien Le Moal954b4a52019-09-05 18:51:30 +0900631 * if available, for single queue devices. If deadline isn't available OR
632 * deadline initialization fails OR we have multiple queues, default to "none".
Christoph Hellwig131d08e2018-05-31 19:11:40 +0200633 */
Damien Le Moal954b4a52019-09-05 18:51:30 +0900634void elevator_init_mq(struct request_queue *q)
Christoph Hellwig131d08e2018-05-31 19:11:40 +0200635{
636 struct elevator_type *e;
Damien Le Moal954b4a52019-09-05 18:51:30 +0900637 int err;
Christoph Hellwig131d08e2018-05-31 19:11:40 +0200638
Damien Le Moal61db4372019-09-05 18:51:29 +0900639 if (!elv_support_iosched(q))
Damien Le Moal954b4a52019-09-05 18:51:30 +0900640 return;
Damien Le Moal61db4372019-09-05 18:51:29 +0900641
Christoph Hellwig131d08e2018-05-31 19:11:40 +0200642 if (q->nr_hw_queues != 1)
Damien Le Moal954b4a52019-09-05 18:51:30 +0900643 return;
Christoph Hellwig131d08e2018-05-31 19:11:40 +0200644
Ming Leic48dac12019-08-27 19:01:45 +0800645 WARN_ON_ONCE(test_bit(QUEUE_FLAG_REGISTERED, &q->queue_flags));
646
Christoph Hellwig131d08e2018-05-31 19:11:40 +0200647 if (unlikely(q->elevator))
Damien Le Moal954b4a52019-09-05 18:51:30 +0900648 return;
Christoph Hellwig131d08e2018-05-31 19:11:40 +0200649
650 e = elevator_get(q, "mq-deadline", false);
651 if (!e)
Damien Le Moal954b4a52019-09-05 18:51:30 +0900652 return;
Christoph Hellwig131d08e2018-05-31 19:11:40 +0200653
654 err = blk_mq_init_sched(q, e);
Damien Le Moal954b4a52019-09-05 18:51:30 +0900655 if (err) {
656 pr_warn("\"%s\" elevator initialization failed, "
657 "falling back to \"none\"\n", e->elevator_name);
Christoph Hellwig131d08e2018-05-31 19:11:40 +0200658 elevator_put(e);
Damien Le Moal954b4a52019-09-05 18:51:30 +0900659 }
Christoph Hellwig131d08e2018-05-31 19:11:40 +0200660}
661
662
663/*
Linus Torvalds1da177e2005-04-16 15:20:36 -0700664 * switch to new_e io scheduler. be careful not to introduce deadlocks -
665 * we don't free the old io scheduler, before we have allocated what we
666 * need for the new one. this way we have a chance of going back to the old
Tejun Heocb98fc82005-10-28 08:29:39 +0200667 * one, if the new one fails init for some reason.
Linus Torvalds1da177e2005-04-16 15:20:36 -0700668 */
Jens Axboe165125e2007-07-24 09:28:11 +0200669static int elevator_switch(struct request_queue *q, struct elevator_type *new_e)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700670{
Tejun Heoe8989fa2012-03-05 13:15:20 -0800671 int err;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700672
Bart Van Assche14a23492018-01-17 11:48:09 -0800673 lockdep_assert_held(&q->sysfs_lock);
674
Jens Axboea1ce35f2018-10-29 10:23:51 -0600675 blk_mq_freeze_queue(q);
676 blk_mq_quiesce_queue(q);
Jianchao Wangd48ece22018-08-21 15:15:03 +0800677
Jens Axboea1ce35f2018-10-29 10:23:51 -0600678 err = elevator_switch_mq(q, new_e);
Jianchao Wangd48ece22018-08-21 15:15:03 +0800679
Jens Axboea1ce35f2018-10-29 10:23:51 -0600680 blk_mq_unquiesce_queue(q);
681 blk_mq_unfreeze_queue(q);
Nick Piggin75ad23b2008-04-29 14:48:33 +0200682
Jens Axboe5dd531a2010-08-23 13:52:19 +0200683 return err;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700684}
685
Jens Axboe5dd531a2010-08-23 13:52:19 +0200686/*
687 * Switch this queue to the given IO scheduler.
688 */
Tomoki Sekiyama7c8a3672013-10-15 16:42:19 -0600689static int __elevator_change(struct request_queue *q, const char *name)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700690{
691 char elevator_name[ELV_NAME_MAX];
692 struct elevator_type *e;
693
David Jefferye9a823f2017-08-28 10:52:44 -0600694 /* Make sure queue is not in the middle of being removed */
Ming Lei58c898b2019-08-27 19:01:47 +0800695 if (!blk_queue_registered(q))
David Jefferye9a823f2017-08-28 10:52:44 -0600696 return -ENOENT;
697
Jens Axboebd166ef2017-01-17 06:03:22 -0700698 /*
699 * Special case for mq, turn off scheduling
700 */
Aleksei Zakharovfbd72122019-02-11 13:50:37 +0300701 if (!strncmp(name, "none", 4)) {
702 if (!q->elevator)
703 return 0;
Jens Axboebd166ef2017-01-17 06:03:22 -0700704 return elevator_switch(q, NULL);
Aleksei Zakharovfbd72122019-02-11 13:50:37 +0300705 }
Martin K. Petersencd43e262009-05-22 17:17:52 -0400706
Li Zefanee2e9922008-10-14 08:49:56 +0200707 strlcpy(elevator_name, name, sizeof(elevator_name));
Jens Axboe2527d992017-10-25 12:33:42 -0600708 e = elevator_get(q, strstrip(elevator_name), true);
Jens Axboe340ff322017-05-10 07:40:04 -0600709 if (!e)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700710 return -EINVAL;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700711
Jens Axboe8ac0d9a2017-10-25 12:35:02 -0600712 if (q->elevator && elevator_match(q->elevator->type, elevator_name)) {
Nate Diller2ca7d932005-10-30 15:02:24 -0800713 elevator_put(e);
Jens Axboe5dd531a2010-08-23 13:52:19 +0200714 return 0;
Nate Diller2ca7d932005-10-30 15:02:24 -0800715 }
Linus Torvalds1da177e2005-04-16 15:20:36 -0700716
Jens Axboe5dd531a2010-08-23 13:52:19 +0200717 return elevator_switch(q, e);
718}
Tomoki Sekiyama7c8a3672013-10-15 16:42:19 -0600719
Jens Axboe5dd531a2010-08-23 13:52:19 +0200720ssize_t elv_iosched_store(struct request_queue *q, const char *name,
721 size_t count)
722{
723 int ret;
724
Jens Axboe344e9ff2018-11-15 12:22:51 -0700725 if (!queue_is_mq(q) || !elv_support_iosched(q))
Jens Axboe5dd531a2010-08-23 13:52:19 +0200726 return count;
727
Tomoki Sekiyama7c8a3672013-10-15 16:42:19 -0600728 ret = __elevator_change(q, name);
Jens Axboe5dd531a2010-08-23 13:52:19 +0200729 if (!ret)
730 return count;
731
Jens Axboe5dd531a2010-08-23 13:52:19 +0200732 return ret;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700733}
734
Jens Axboe165125e2007-07-24 09:28:11 +0200735ssize_t elv_iosched_show(struct request_queue *q, char *name)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700736{
Jens Axboeb374d182008-10-31 10:05:07 +0100737 struct elevator_queue *e = q->elevator;
Jens Axboebd166ef2017-01-17 06:03:22 -0700738 struct elevator_type *elv = NULL;
Matthias Kaehlcke70cee262007-07-10 12:26:24 +0200739 struct elevator_type *__e;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700740 int len = 0;
741
Jens Axboe344e9ff2018-11-15 12:22:51 -0700742 if (!queue_is_mq(q))
Martin K. Petersencd43e262009-05-22 17:17:52 -0400743 return sprintf(name, "none\n");
744
Jens Axboebd166ef2017-01-17 06:03:22 -0700745 if (!q->elevator)
746 len += sprintf(name+len, "[none] ");
747 else
748 elv = e->type;
Martin K. Petersencd43e262009-05-22 17:17:52 -0400749
Jens Axboe2a12dcd2007-04-26 14:41:53 +0200750 spin_lock(&elv_list_lock);
Matthias Kaehlcke70cee262007-07-10 12:26:24 +0200751 list_for_each_entry(__e, &elv_list, list) {
Jens Axboea1ce35f2018-10-29 10:23:51 -0600752 if (elv && elevator_match(elv, __e->elevator_name)) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700753 len += sprintf(name+len, "[%s] ", elv->elevator_name);
Jens Axboebd166ef2017-01-17 06:03:22 -0700754 continue;
755 }
Jens Axboea1ce35f2018-10-29 10:23:51 -0600756 if (elv_support_iosched(q))
Linus Torvalds1da177e2005-04-16 15:20:36 -0700757 len += sprintf(name+len, "%s ", __e->elevator_name);
758 }
Jens Axboe2a12dcd2007-04-26 14:41:53 +0200759 spin_unlock(&elv_list_lock);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700760
Jens Axboe344e9ff2018-11-15 12:22:51 -0700761 if (q->elevator)
Jens Axboebd166ef2017-01-17 06:03:22 -0700762 len += sprintf(name+len, "none");
763
Linus Torvalds1da177e2005-04-16 15:20:36 -0700764 len += sprintf(len+name, "\n");
765 return len;
766}
767
Jens Axboe165125e2007-07-24 09:28:11 +0200768struct request *elv_rb_former_request(struct request_queue *q,
769 struct request *rq)
Jens Axboe2e662b62006-07-13 11:55:04 +0200770{
771 struct rb_node *rbprev = rb_prev(&rq->rb_node);
772
773 if (rbprev)
774 return rb_entry_rq(rbprev);
775
776 return NULL;
777}
Jens Axboe2e662b62006-07-13 11:55:04 +0200778EXPORT_SYMBOL(elv_rb_former_request);
779
Jens Axboe165125e2007-07-24 09:28:11 +0200780struct request *elv_rb_latter_request(struct request_queue *q,
781 struct request *rq)
Jens Axboe2e662b62006-07-13 11:55:04 +0200782{
783 struct rb_node *rbnext = rb_next(&rq->rb_node);
784
785 if (rbnext)
786 return rb_entry_rq(rbnext);
787
788 return NULL;
789}
Jens Axboe2e662b62006-07-13 11:55:04 +0200790EXPORT_SYMBOL(elv_rb_latter_request);