Greg Kroah-Hartman | b244131 | 2017-11-01 15:07:57 +0100 | [diff] [blame] | 1 | /* SPDX-License-Identifier: GPL-2.0 */ |
Jens Axboe | 320ae51 | 2013-10-24 09:20:05 +0100 | [diff] [blame] | 2 | #ifndef INT_BLK_MQ_H |
| 3 | #define INT_BLK_MQ_H |
| 4 | |
Jens Axboe | cf43e6b | 2016-11-07 21:32:37 -0700 | [diff] [blame] | 5 | #include "blk-stat.h" |
Ming Lei | 244c65a | 2017-11-04 12:39:57 -0600 | [diff] [blame] | 6 | #include "blk-mq-tag.h" |
Jens Axboe | cf43e6b | 2016-11-07 21:32:37 -0700 | [diff] [blame] | 7 | |
Christoph Hellwig | 24d2f90 | 2014-04-15 14:14:00 -0600 | [diff] [blame] | 8 | struct blk_mq_tag_set; |
| 9 | |
/*
 * struct blk_mq_ctxs - holder for a set of software queue contexts
 * @kobj:      kobject embedded in this holder
 * @queue_ctx: per-CPU (__percpu) pointer to the struct blk_mq_ctx instances
 *
 * Every struct blk_mq_ctx carries a ->ctxs pointer of this type.
 * NOTE(review): presumably one holder is shared by all ctxs of a request
 * queue - confirm against the allocation code.
 */
struct blk_mq_ctxs {
	struct kobject kobj;
	struct blk_mq_ctx __percpu	*queue_ctx;
};
| 14 | |
/**
 * struct blk_mq_ctx - State for a software queue facing the submitting CPUs
 */
struct blk_mq_ctx {
	/*
	 * Lock plus one request list per hctx type, grouped in an anonymous
	 * struct that is cacheline-aligned on SMP builds.
	 * NOTE(review): presumably @lock protects @rq_lists - confirm.
	 */
	struct {
		spinlock_t		lock;
		struct list_head	rq_lists[HCTX_MAX_TYPES];
	} ____cacheline_aligned_in_smp;

	/* NOTE(review): presumably the CPU this ctx belongs to - confirm */
	unsigned int		cpu;
	/*
	 * One slot per hctx type.
	 * NOTE(review): presumably this ctx's index inside each mapped
	 * hardware queue - confirm against the mapping code.
	 */
	unsigned short		index_hw[HCTX_MAX_TYPES];
	/* hardware queue per hctx type; read by blk_mq_map_queue() */
	struct blk_mq_hw_ctx 	*hctxs[HCTX_MAX_TYPES];

	/* incremented at dispatch time */
	unsigned long		rq_dispatched[2];
	unsigned long		rq_merged;

	/* incremented at completion time */
	unsigned long		____cacheline_aligned_in_smp rq_completed[2];

	/* back-pointers to the owning request queue and the ctxs holder */
	struct request_queue	*queue;
	struct blk_mq_ctxs      *ctxs;
	/* kobject embedded in this ctx */
	struct kobject		kobj;
} ____cacheline_aligned_in_smp;
Jens Axboe | 320ae51 | 2013-10-24 09:20:05 +0100 | [diff] [blame] | 39 | |
/*
 * blk-mq internal entry points. Only the declarations live in this header;
 * the definitions are not visible here.
 *
 * NOTE(review): blk_mq_dispatch_rq_list() leaves its last two parameters
 * unnamed - consider naming them to match the definition.
 */
void blk_mq_exit_queue(struct request_queue *q);
int blk_mq_update_nr_requests(struct request_queue *q, unsigned int nr);
void blk_mq_wake_waiters(struct request_queue *q);
bool blk_mq_dispatch_rq_list(struct blk_mq_hw_ctx *hctx, struct list_head *,
			     unsigned int);
void blk_mq_add_to_requeue_list(struct request *rq, bool at_head,
				bool kick_requeue_list);
void blk_mq_flush_busy_ctxs(struct blk_mq_hw_ctx *hctx, struct list_head *list);
struct request *blk_mq_dequeue_from_ctx(struct blk_mq_hw_ctx *hctx,
					struct blk_mq_ctx *start);
Jens Axboe | 2c3ad66 | 2016-12-14 14:34:47 -0700 | [diff] [blame] | 50 | |
/*
 * Internal helpers for allocating/freeing the request map
 *
 * All of them operate on a struct blk_mq_tags; the alloc/free_rqs variants
 * additionally take the owning tag set and a hardware queue index.
 */
void blk_mq_free_rqs(struct blk_mq_tag_set *set, struct blk_mq_tags *tags,
		     unsigned int hctx_idx);
void blk_mq_free_rq_map(struct blk_mq_tags *tags);
struct blk_mq_tags *blk_mq_alloc_rq_map(struct blk_mq_tag_set *set,
					unsigned int hctx_idx,
					unsigned int nr_tags,
					unsigned int reserved_tags);
int blk_mq_alloc_rqs(struct blk_mq_tag_set *set, struct blk_mq_tags *tags,
		     unsigned int hctx_idx, unsigned int depth);
Jens Axboe | 2c3ad66 | 2016-12-14 14:34:47 -0700 | [diff] [blame] | 63 | |
/*
 * Internal helpers for request insertion into sw queues
 *
 * @at_head selects head vs. tail placement; @run_queue is passed through to
 * the bypass-insert implementation.
 * NOTE(review): presumably @run_queue asks for the hardware queue to be run
 * after insertion - confirm against the definition.
 */
void __blk_mq_insert_request(struct blk_mq_hw_ctx *hctx, struct request *rq,
				bool at_head);
void blk_mq_request_bypass_insert(struct request *rq, bool at_head,
				  bool run_queue);
void blk_mq_insert_requests(struct blk_mq_hw_ctx *hctx, struct blk_mq_ctx *ctx,
				struct list_head *list);
Jens Axboe | 320ae51 | 2013-10-24 09:20:05 +0100 | [diff] [blame] | 73 | |
/* Used by blk_insert_cloned_request() to issue request directly */
blk_status_t blk_mq_request_issue_directly(struct request *rq, bool last);
/* List variant: takes the hardware queue and a list of requests to issue */
void blk_mq_try_issue_list_directly(struct blk_mq_hw_ctx *hctx,
				    struct list_head *list);
Ming Lei | 396eaf2 | 2018-01-17 11:25:57 -0500 | [diff] [blame] | 78 | |
/*
 * CPU -> queue mappings
 *
 * NOTE(review): the second parameter is unnamed; presumably it is the
 * hardware queue index to look up in @qmap - confirm and name it.
 */
extern int blk_mq_hw_queue_to_node(struct blk_mq_queue_map *qmap, unsigned int);
Jens Axboe | 320ae51 | 2013-10-24 09:20:05 +0100 | [diff] [blame] | 83 | |
Jens Axboe | b3c661b | 2018-10-30 10:36:06 -0600 | [diff] [blame] | 84 | /* |
| 85 | * blk_mq_map_queue_type() - map (hctx_type,cpu) to hardware queue |
| 86 | * @q: request queue |
Christoph Hellwig | e20ba6e | 2018-12-02 17:46:16 +0100 | [diff] [blame] | 87 | * @type: the hctx type index |
Jens Axboe | b3c661b | 2018-10-30 10:36:06 -0600 | [diff] [blame] | 88 | * @cpu: CPU |
| 89 | */ |
Jens Axboe | ff2c566 | 2018-10-29 13:07:33 -0600 | [diff] [blame] | 90 | static inline struct blk_mq_hw_ctx *blk_mq_map_queue_type(struct request_queue *q, |
Christoph Hellwig | e20ba6e | 2018-12-02 17:46:16 +0100 | [diff] [blame] | 91 | enum hctx_type type, |
Jens Axboe | ff2c566 | 2018-10-29 13:07:33 -0600 | [diff] [blame] | 92 | unsigned int cpu) |
| 93 | { |
Christoph Hellwig | e20ba6e | 2018-12-02 17:46:16 +0100 | [diff] [blame] | 94 | return q->queue_hw_ctx[q->tag_set->map[type].mq_map[cpu]]; |
Jens Axboe | b3c661b | 2018-10-30 10:36:06 -0600 | [diff] [blame] | 95 | } |
| 96 | |
| 97 | /* |
| 98 | * blk_mq_map_queue() - map (cmd_flags,type) to hardware queue |
| 99 | * @q: request queue |
| 100 | * @flags: request command flags |
Jianchao Wang | 8ccdf4a | 2019-01-24 18:25:32 +0800 | [diff] [blame] | 101 | * @cpu: cpu ctx |
Jens Axboe | b3c661b | 2018-10-30 10:36:06 -0600 | [diff] [blame] | 102 | */ |
| 103 | static inline struct blk_mq_hw_ctx *blk_mq_map_queue(struct request_queue *q, |
| 104 | unsigned int flags, |
Jianchao Wang | 8ccdf4a | 2019-01-24 18:25:32 +0800 | [diff] [blame] | 105 | struct blk_mq_ctx *ctx) |
Jens Axboe | b3c661b | 2018-10-30 10:36:06 -0600 | [diff] [blame] | 106 | { |
Christoph Hellwig | e20ba6e | 2018-12-02 17:46:16 +0100 | [diff] [blame] | 107 | enum hctx_type type = HCTX_TYPE_DEFAULT; |
Jens Axboe | b3c661b | 2018-10-30 10:36:06 -0600 | [diff] [blame] | 108 | |
Jianchao Wang | bb94aea | 2019-01-24 18:25:33 +0800 | [diff] [blame] | 109 | /* |
| 110 | * The caller ensure that if REQ_HIPRI, poll must be enabled. |
| 111 | */ |
| 112 | if (flags & REQ_HIPRI) |
Christoph Hellwig | e20ba6e | 2018-12-02 17:46:16 +0100 | [diff] [blame] | 113 | type = HCTX_TYPE_POLL; |
Jianchao Wang | bb94aea | 2019-01-24 18:25:33 +0800 | [diff] [blame] | 114 | else if ((flags & REQ_OP_MASK) == REQ_OP_READ) |
Christoph Hellwig | e20ba6e | 2018-12-02 17:46:16 +0100 | [diff] [blame] | 115 | type = HCTX_TYPE_READ; |
Christoph Hellwig | 5aceaeb | 2018-12-17 12:16:26 +0100 | [diff] [blame] | 116 | |
Jianchao Wang | 8ccdf4a | 2019-01-24 18:25:32 +0800 | [diff] [blame] | 117 | return ctx->hctxs[type]; |
Jens Axboe | ff2c566 | 2018-10-29 13:07:33 -0600 | [diff] [blame] | 118 | } |
| 119 | |
/*
 * sysfs helpers
 *
 * Declarations only; the definitions are not part of this header. The
 * register variants return an int status, the others return nothing.
 */
extern void blk_mq_sysfs_init(struct request_queue *q);
extern void blk_mq_sysfs_deinit(struct request_queue *q);
extern int __blk_mq_register_dev(struct device *dev, struct request_queue *q);
extern int blk_mq_sysfs_register(struct request_queue *q);
extern void blk_mq_sysfs_unregister(struct request_queue *q);
extern void blk_mq_hctx_kobj_init(struct blk_mq_hw_ctx *hctx);
Jens Axboe | 67aec14 | 2014-05-30 08:25:36 -0600 | [diff] [blame] | 129 | |
/*
 * NOTE(review): presumably frees the blk-mq resources still attached to @q
 * when the queue is released - confirm against the definition.
 */
void blk_mq_release(struct request_queue *q);
| 131 | |
Ming Lei | 1aecfe4 | 2014-06-01 00:43:36 +0800 | [diff] [blame] | 132 | static inline struct blk_mq_ctx *__blk_mq_get_ctx(struct request_queue *q, |
| 133 | unsigned int cpu) |
| 134 | { |
| 135 | return per_cpu_ptr(q->queue_ctx, cpu); |
| 136 | } |
| 137 | |
/*
 * Software queues are assumed to be per-cpu here (per-node would be another
 * option, but the per-cpu choice is hardcoded for now). Preemption is not a
 * concern because the ctx's are persistent; the flip side is that the ctx
 * returned is not guaranteed to match the CPU the caller ends up running on.
 */
static inline struct blk_mq_ctx *blk_mq_get_ctx(struct request_queue *q)
{
	unsigned int this_cpu = raw_smp_processor_id();

	return __blk_mq_get_ctx(q, this_cpu);
}
| 148 | |
/*
 * struct blk_mq_alloc_data - parameter block for blk-mq allocation helpers
 *
 * blk_mq_tags_from_data() reads ->q->elevator and ->hctx from this
 * structure to pick the tag set to allocate from.
 */
struct blk_mq_alloc_data {
	/* input parameter */
	struct request_queue *q;
	blk_mq_req_flags_t flags;
	unsigned int shallow_depth;
	/* NOTE(review): presumably REQ_* command flags - confirm with callers */
	unsigned int cmd_flags;

	/* input & output parameter */
	struct blk_mq_ctx *ctx;
	struct blk_mq_hw_ctx *hctx;
};
| 160 | |
Jens Axboe | 4941115 | 2017-01-13 08:09:05 -0700 | [diff] [blame] | 161 | static inline struct blk_mq_tags *blk_mq_tags_from_data(struct blk_mq_alloc_data *data) |
| 162 | { |
Christoph Hellwig | 42fdc5e | 2020-06-29 17:08:34 +0200 | [diff] [blame] | 163 | if (data->q->elevator) |
Jens Axboe | bd166ef | 2017-01-17 06:03:22 -0700 | [diff] [blame] | 164 | return data->hctx->sched_tags; |
| 165 | |
Jens Axboe | 4941115 | 2017-01-13 08:09:05 -0700 | [diff] [blame] | 166 | return data->hctx->tags; |
| 167 | } |
| 168 | |
Bart Van Assche | 5d1b25c | 2016-10-28 17:19:15 -0700 | [diff] [blame] | 169 | static inline bool blk_mq_hctx_stopped(struct blk_mq_hw_ctx *hctx) |
| 170 | { |
| 171 | return test_bit(BLK_MQ_S_STOPPED, &hctx->state); |
| 172 | } |
| 173 | |
Ming Lei | 19c66e5 | 2014-12-03 19:38:04 +0800 | [diff] [blame] | 174 | static inline bool blk_mq_hw_queue_mapped(struct blk_mq_hw_ctx *hctx) |
| 175 | { |
| 176 | return hctx->nr_ctx && hctx->tags; |
| 177 | } |
| 178 | |
/*
 * In-flight accounting for a partition of @q. The _rw variant fills a
 * caller-provided two-element array instead of returning a single count.
 * NOTE(review): presumably inflight[0]/inflight[1] are read/write counts -
 * confirm against the definition.
 */
unsigned int blk_mq_in_flight(struct request_queue *q, struct hd_struct *part);
void blk_mq_in_flight_rw(struct request_queue *q, struct hd_struct *part,
			 unsigned int inflight[2]);
Jens Axboe | f299b7c | 2017-08-08 17:51:45 -0600 | [diff] [blame] | 182 | |
Ming Lei | 65c7636 | 2020-06-30 18:24:56 +0800 | [diff] [blame] | 183 | static inline void blk_mq_put_dispatch_budget(struct request_queue *q) |
Ming Lei | de14829 | 2017-10-14 17:22:29 +0800 | [diff] [blame] | 184 | { |
Ming Lei | de14829 | 2017-10-14 17:22:29 +0800 | [diff] [blame] | 185 | if (q->mq_ops->put_budget) |
Ming Lei | 65c7636 | 2020-06-30 18:24:56 +0800 | [diff] [blame] | 186 | q->mq_ops->put_budget(q); |
Ming Lei | de14829 | 2017-10-14 17:22:29 +0800 | [diff] [blame] | 187 | } |
| 188 | |
Ming Lei | 65c7636 | 2020-06-30 18:24:56 +0800 | [diff] [blame] | 189 | static inline bool blk_mq_get_dispatch_budget(struct request_queue *q) |
Ming Lei | de14829 | 2017-10-14 17:22:29 +0800 | [diff] [blame] | 190 | { |
Ming Lei | de14829 | 2017-10-14 17:22:29 +0800 | [diff] [blame] | 191 | if (q->mq_ops->get_budget) |
Ming Lei | 65c7636 | 2020-06-30 18:24:56 +0800 | [diff] [blame] | 192 | return q->mq_ops->get_budget(q); |
Ming Lei | 88022d7 | 2017-11-05 02:21:12 +0800 | [diff] [blame] | 193 | return true; |
Ming Lei | de14829 | 2017-10-14 17:22:29 +0800 | [diff] [blame] | 194 | } |
| 195 | |
Jens Axboe | 4e2f62e5 | 2020-07-01 22:58:32 -0600 | [diff] [blame] | 196 | static inline void __blk_mq_put_driver_tag(struct blk_mq_hw_ctx *hctx, |
| 197 | struct request *rq) |
| 198 | { |
| 199 | blk_mq_put_tag(hctx->tags, rq->mq_ctx, rq->tag); |
| 200 | rq->tag = BLK_MQ_NO_TAG; |
| 201 | |
| 202 | if (rq->rq_flags & RQF_MQ_INFLIGHT) { |
| 203 | rq->rq_flags &= ~RQF_MQ_INFLIGHT; |
| 204 | atomic_dec(&hctx->nr_active); |
| 205 | } |
| 206 | } |
| 207 | |
| 208 | static inline void blk_mq_put_driver_tag(struct request *rq) |
| 209 | { |
| 210 | if (rq->tag == BLK_MQ_NO_TAG || rq->internal_tag == BLK_MQ_NO_TAG) |
| 211 | return; |
| 212 | |
| 213 | __blk_mq_put_driver_tag(rq->mq_hctx, rq); |
| 214 | } |
| 215 | |
Jens Axboe | ed76e32 | 2018-10-29 13:06:14 -0600 | [diff] [blame] | 216 | static inline void blk_mq_clear_mq_map(struct blk_mq_queue_map *qmap) |
Minwoo Im | 0da73d0 | 2018-07-02 23:46:43 +0900 | [diff] [blame] | 217 | { |
| 218 | int cpu; |
| 219 | |
| 220 | for_each_possible_cpu(cpu) |
Jens Axboe | ed76e32 | 2018-10-29 13:06:14 -0600 | [diff] [blame] | 221 | qmap->mq_map[cpu] = 0; |
Minwoo Im | 0da73d0 | 2018-07-02 23:46:43 +0900 | [diff] [blame] | 222 | } |
| 223 | |
Damien Le Moal | b49773e7 | 2019-07-11 01:18:31 +0900 | [diff] [blame] | 224 | /* |
| 225 | * blk_mq_plug() - Get caller context plug |
| 226 | * @q: request queue |
| 227 | * @bio : the bio being submitted by the caller context |
| 228 | * |
| 229 | * Plugging, by design, may delay the insertion of BIOs into the elevator in |
| 230 | * order to increase BIO merging opportunities. This however can cause BIO |
| 231 | * insertion order to change from the order in which submit_bio() is being |
| 232 | * executed in the case of multiple contexts concurrently issuing BIOs to a |
| 233 | * device, even if these context are synchronized to tightly control BIO issuing |
| 234 | * order. While this is not a problem with regular block devices, this ordering |
| 235 | * change can cause write BIO failures with zoned block devices as these |
| 236 | * require sequential write patterns to zones. Prevent this from happening by |
| 237 | * ignoring the plug state of a BIO issuing context if the target request queue |
| 238 | * is for a zoned block device and the BIO to plug is a write operation. |
| 239 | * |
| 240 | * Return current->plug if the bio can be plugged and NULL otherwise |
| 241 | */ |
| 242 | static inline struct blk_plug *blk_mq_plug(struct request_queue *q, |
| 243 | struct bio *bio) |
| 244 | { |
| 245 | /* |
| 246 | * For regular block devices or read operations, use the context plug |
| 247 | * which may be NULL if blk_start_plug() was not executed. |
| 248 | */ |
| 249 | if (!blk_queue_is_zoned(q) || !op_is_write(bio_op(bio))) |
| 250 | return current->plug; |
| 251 | |
| 252 | /* Zoned block device write operation case: do not plug the BIO */ |
| 253 | return NULL; |
| 254 | } |
| 255 | |
Jens Axboe | 320ae51 | 2013-10-24 09:20:05 +0100 | [diff] [blame] | 256 | #endif |