Greg Kroah-Hartman | b244131 | 2017-11-01 15:07:57 +0100 | [diff] [blame] | 1 | /* SPDX-License-Identifier: GPL-2.0 */ |
Jens Axboe | 320ae51 | 2013-10-24 09:20:05 +0100 | [diff] [blame] | 2 | #ifndef INT_BLK_MQ_H |
| 3 | #define INT_BLK_MQ_H |
| 4 | |
Jens Axboe | cf43e6b | 2016-11-07 21:32:37 -0700 | [diff] [blame] | 5 | #include "blk-stat.h" |
Ming Lei | 244c65a | 2017-11-04 12:39:57 -0600 | [diff] [blame] | 6 | #include "blk-mq-tag.h" |
Jens Axboe | cf43e6b | 2016-11-07 21:32:37 -0700 | [diff] [blame] | 7 | |
Christoph Hellwig | 24d2f90 | 2014-04-15 14:14:00 -0600 | [diff] [blame] | 8 | struct blk_mq_tag_set; |
| 9 | |
Ming Lei | 1db4909 | 2018-11-20 09:44:35 +0800 | [diff] [blame] | 10 | struct blk_mq_ctxs { |
| 11 | struct kobject kobj; |
| 12 | struct blk_mq_ctx __percpu *queue_ctx; |
| 13 | }; |
| 14 | |
Linus Walleij | fe64407 | 2018-04-20 10:29:51 +0200 | [diff] [blame] | 15 | /** |
| 16 | * struct blk_mq_ctx - State for a software queue facing the submitting CPUs |
| 17 | */ |
Jens Axboe | 320ae51 | 2013-10-24 09:20:05 +0100 | [diff] [blame] | 18 | struct blk_mq_ctx { |
| 19 | struct { |
| 20 | spinlock_t lock; |
Ming Lei | c16d6b5 | 2018-12-17 08:44:05 -0700 | [diff] [blame] | 21 | struct list_head rq_lists[HCTX_MAX_TYPES]; |
| 22 | } ____cacheline_aligned_in_smp; |
Jens Axboe | 320ae51 | 2013-10-24 09:20:05 +0100 | [diff] [blame] | 23 | |
| 24 | unsigned int cpu; |
Jens Axboe | f31967f | 2018-10-29 13:13:29 -0600 | [diff] [blame] | 25 | unsigned short index_hw[HCTX_MAX_TYPES]; |
Jianchao Wang | 8ccdf4a | 2019-01-24 18:25:32 +0800 | [diff] [blame] | 26 | struct blk_mq_hw_ctx *hctxs[HCTX_MAX_TYPES]; |
Jens Axboe | 320ae51 | 2013-10-24 09:20:05 +0100 | [diff] [blame] | 27 | |
| 28 | /* incremented at dispatch time */ |
| 29 | unsigned long rq_dispatched[2]; |
| 30 | unsigned long rq_merged; |
| 31 | |
| 32 | /* incremented at completion time */ |
| 33 | unsigned long ____cacheline_aligned_in_smp rq_completed[2]; |
| 34 | |
| 35 | struct request_queue *queue; |
Ming Lei | 1db4909 | 2018-11-20 09:44:35 +0800 | [diff] [blame] | 36 | struct blk_mq_ctxs *ctxs; |
Jens Axboe | 320ae51 | 2013-10-24 09:20:05 +0100 | [diff] [blame] | 37 | struct kobject kobj; |
Jens Axboe | 4bb659b | 2014-05-09 09:36:49 -0600 | [diff] [blame] | 38 | } ____cacheline_aligned_in_smp; |
Jens Axboe | 320ae51 | 2013-10-24 09:20:05 +0100 | [diff] [blame] | 39 | |
Ming Lei | c7e2d94 | 2019-04-30 09:52:25 +0800 | [diff] [blame] | 40 | void blk_mq_exit_queue(struct request_queue *q); |
Jens Axboe | e3a2b3f | 2014-05-20 11:49:02 -0600 | [diff] [blame] | 41 | int blk_mq_update_nr_requests(struct request_queue *q, unsigned int nr); |
Jens Axboe | aed3ea9 | 2014-12-22 14:04:42 -0700 | [diff] [blame] | 42 | void blk_mq_wake_waiters(struct request_queue *q); |
Ming Lei | de14829 | 2017-10-14 17:22:29 +0800 | [diff] [blame] | 43 | bool blk_mq_dispatch_rq_list(struct request_queue *, struct list_head *, bool); |
Bart Van Assche | e6c9871 | 2019-03-20 13:14:37 -0700 | [diff] [blame] | 44 | void blk_mq_add_to_requeue_list(struct request *rq, bool at_head, |
| 45 | bool kick_requeue_list); |
Jens Axboe | 2c3ad66 | 2016-12-14 14:34:47 -0700 | [diff] [blame] | 46 | void blk_mq_flush_busy_ctxs(struct blk_mq_hw_ctx *hctx, struct list_head *list); |
Ming Lei | b347689 | 2017-10-14 17:22:30 +0800 | [diff] [blame] | 47 | struct request *blk_mq_dequeue_from_ctx(struct blk_mq_hw_ctx *hctx, |
| 48 | struct blk_mq_ctx *start); |
Jens Axboe | 2c3ad66 | 2016-12-14 14:34:47 -0700 | [diff] [blame] | 49 | |
/*
 * Helpers private to blk-mq that allocate and free the request map
 */
void blk_mq_free_rqs(struct blk_mq_tag_set *set,
		     struct blk_mq_tags *tags,
		     unsigned int hctx_idx);
void blk_mq_free_rq_map(struct blk_mq_tags *tags);
struct blk_mq_tags *blk_mq_alloc_rq_map(struct blk_mq_tag_set *set,
					unsigned int hctx_idx,
					unsigned int nr_tags,
					unsigned int reserved_tags);
int blk_mq_alloc_rqs(struct blk_mq_tag_set *set,
		     struct blk_mq_tags *tags,
		     unsigned int hctx_idx,
		     unsigned int depth);
Jens Axboe | 2c3ad66 | 2016-12-14 14:34:47 -0700 | [diff] [blame] | 62 | |
| 63 | /* |
| 64 | * Internal helpers for request insertion into sw queues |
| 65 | */ |
| 66 | void __blk_mq_insert_request(struct blk_mq_hw_ctx *hctx, struct request *rq, |
| 67 | bool at_head); |
Ming Lei | 01e99ae | 2020-02-25 09:04:32 +0800 | [diff] [blame] | 68 | void blk_mq_request_bypass_insert(struct request *rq, bool at_head, |
| 69 | bool run_queue); |
Jens Axboe | bd166ef | 2017-01-17 06:03:22 -0700 | [diff] [blame] | 70 | void blk_mq_insert_requests(struct blk_mq_hw_ctx *hctx, struct blk_mq_ctx *ctx, |
| 71 | struct list_head *list); |
Jens Axboe | 320ae51 | 2013-10-24 09:20:05 +0100 | [diff] [blame] | 72 | |
Bart Van Assche | fd9c40f | 2019-04-04 10:08:43 -0700 | [diff] [blame] | 73 | /* Used by blk_insert_cloned_request() to issue request directly */ |
| 74 | blk_status_t blk_mq_request_issue_directly(struct request *rq, bool last); |
Ming Lei | 6ce3dd6 | 2018-07-10 09:03:31 +0800 | [diff] [blame] | 75 | void blk_mq_try_issue_list_directly(struct blk_mq_hw_ctx *hctx, |
| 76 | struct list_head *list); |
Ming Lei | 396eaf2 | 2018-01-17 11:25:57 -0500 | [diff] [blame] | 77 | |
/*
 * CPU -> queue mappings
 *
 * NOTE(review): the second parameter was unnamed in the original prototype;
 * "index" is presumed to be a hardware queue index - confirm against the
 * definition.
 */
int blk_mq_hw_queue_to_node(struct blk_mq_queue_map *qmap, unsigned int index);
Jens Axboe | 320ae51 | 2013-10-24 09:20:05 +0100 | [diff] [blame] | 82 | |
Jens Axboe | b3c661b | 2018-10-30 10:36:06 -0600 | [diff] [blame] | 83 | /* |
| 84 | * blk_mq_map_queue_type() - map (hctx_type,cpu) to hardware queue |
| 85 | * @q: request queue |
Christoph Hellwig | e20ba6e | 2018-12-02 17:46:16 +0100 | [diff] [blame] | 86 | * @type: the hctx type index |
Jens Axboe | b3c661b | 2018-10-30 10:36:06 -0600 | [diff] [blame] | 87 | * @cpu: CPU |
| 88 | */ |
Jens Axboe | ff2c566 | 2018-10-29 13:07:33 -0600 | [diff] [blame] | 89 | static inline struct blk_mq_hw_ctx *blk_mq_map_queue_type(struct request_queue *q, |
Christoph Hellwig | e20ba6e | 2018-12-02 17:46:16 +0100 | [diff] [blame] | 90 | enum hctx_type type, |
Jens Axboe | ff2c566 | 2018-10-29 13:07:33 -0600 | [diff] [blame] | 91 | unsigned int cpu) |
| 92 | { |
Christoph Hellwig | e20ba6e | 2018-12-02 17:46:16 +0100 | [diff] [blame] | 93 | return q->queue_hw_ctx[q->tag_set->map[type].mq_map[cpu]]; |
Jens Axboe | b3c661b | 2018-10-30 10:36:06 -0600 | [diff] [blame] | 94 | } |
| 95 | |
| 96 | /* |
| 97 | * blk_mq_map_queue() - map (cmd_flags,type) to hardware queue |
| 98 | * @q: request queue |
| 99 | * @flags: request command flags |
Jianchao Wang | 8ccdf4a | 2019-01-24 18:25:32 +0800 | [diff] [blame] | 100 | * @cpu: cpu ctx |
Jens Axboe | b3c661b | 2018-10-30 10:36:06 -0600 | [diff] [blame] | 101 | */ |
| 102 | static inline struct blk_mq_hw_ctx *blk_mq_map_queue(struct request_queue *q, |
| 103 | unsigned int flags, |
Jianchao Wang | 8ccdf4a | 2019-01-24 18:25:32 +0800 | [diff] [blame] | 104 | struct blk_mq_ctx *ctx) |
Jens Axboe | b3c661b | 2018-10-30 10:36:06 -0600 | [diff] [blame] | 105 | { |
Christoph Hellwig | e20ba6e | 2018-12-02 17:46:16 +0100 | [diff] [blame] | 106 | enum hctx_type type = HCTX_TYPE_DEFAULT; |
Jens Axboe | b3c661b | 2018-10-30 10:36:06 -0600 | [diff] [blame] | 107 | |
Jianchao Wang | bb94aea | 2019-01-24 18:25:33 +0800 | [diff] [blame] | 108 | /* |
| 109 | * The caller ensure that if REQ_HIPRI, poll must be enabled. |
| 110 | */ |
| 111 | if (flags & REQ_HIPRI) |
Christoph Hellwig | e20ba6e | 2018-12-02 17:46:16 +0100 | [diff] [blame] | 112 | type = HCTX_TYPE_POLL; |
Jianchao Wang | bb94aea | 2019-01-24 18:25:33 +0800 | [diff] [blame] | 113 | else if ((flags & REQ_OP_MASK) == REQ_OP_READ) |
Christoph Hellwig | e20ba6e | 2018-12-02 17:46:16 +0100 | [diff] [blame] | 114 | type = HCTX_TYPE_READ; |
Christoph Hellwig | 5aceaeb | 2018-12-17 12:16:26 +0100 | [diff] [blame] | 115 | |
Jianchao Wang | 8ccdf4a | 2019-01-24 18:25:32 +0800 | [diff] [blame] | 116 | return ctx->hctxs[type]; |
Jens Axboe | ff2c566 | 2018-10-29 13:07:33 -0600 | [diff] [blame] | 117 | } |
| 118 | |
/*
 * sysfs helpers
 *
 * Declared without "extern", matching the other prototypes in this header;
 * the keyword is redundant on function declarations.
 */
void blk_mq_sysfs_init(struct request_queue *q);
void blk_mq_sysfs_deinit(struct request_queue *q);
int __blk_mq_register_dev(struct device *dev, struct request_queue *q);
int blk_mq_sysfs_register(struct request_queue *q);
void blk_mq_sysfs_unregister(struct request_queue *q);
void blk_mq_hctx_kobj_init(struct blk_mq_hw_ctx *hctx);

void blk_mq_release(struct request_queue *q);
| 130 | |
Ming Lei | 1aecfe4 | 2014-06-01 00:43:36 +0800 | [diff] [blame] | 131 | static inline struct blk_mq_ctx *__blk_mq_get_ctx(struct request_queue *q, |
| 132 | unsigned int cpu) |
| 133 | { |
| 134 | return per_cpu_ptr(q->queue_ctx, cpu); |
| 135 | } |
| 136 | |
/*
 * Software queues are assumed to be per-CPU here (per-node would be another
 * option); that choice is hardcoded for now. Preemption is deliberately not
 * disabled because the ctx's are persistent, so the returned ctx is not
 * guaranteed to match the CPU the caller ends up running on.
 */
static inline struct blk_mq_ctx *blk_mq_get_ctx(struct request_queue *q)
{
	unsigned int cpu = raw_smp_processor_id();

	return __blk_mq_get_ctx(q, cpu);
}
| 147 | |
Ming Lei | cb96a42c | 2014-06-01 00:43:37 +0800 | [diff] [blame] | 148 | struct blk_mq_alloc_data { |
| 149 | /* input parameter */ |
| 150 | struct request_queue *q; |
Bart Van Assche | 9a95e4e | 2017-11-09 10:49:59 -0800 | [diff] [blame] | 151 | blk_mq_req_flags_t flags; |
Omar Sandoval | 229a9287 | 2017-04-14 00:59:59 -0700 | [diff] [blame] | 152 | unsigned int shallow_depth; |
Jens Axboe | f9afca4 | 2018-10-29 13:11:38 -0600 | [diff] [blame] | 153 | unsigned int cmd_flags; |
Ming Lei | cb96a42c | 2014-06-01 00:43:37 +0800 | [diff] [blame] | 154 | |
| 155 | /* input & output parameter */ |
| 156 | struct blk_mq_ctx *ctx; |
| 157 | struct blk_mq_hw_ctx *hctx; |
| 158 | }; |
| 159 | |
Jens Axboe | 4941115 | 2017-01-13 08:09:05 -0700 | [diff] [blame] | 160 | static inline struct blk_mq_tags *blk_mq_tags_from_data(struct blk_mq_alloc_data *data) |
| 161 | { |
Jens Axboe | bd166ef | 2017-01-17 06:03:22 -0700 | [diff] [blame] | 162 | if (data->flags & BLK_MQ_REQ_INTERNAL) |
| 163 | return data->hctx->sched_tags; |
| 164 | |
Jens Axboe | 4941115 | 2017-01-13 08:09:05 -0700 | [diff] [blame] | 165 | return data->hctx->tags; |
| 166 | } |
| 167 | |
Bart Van Assche | 5d1b25c | 2016-10-28 17:19:15 -0700 | [diff] [blame] | 168 | static inline bool blk_mq_hctx_stopped(struct blk_mq_hw_ctx *hctx) |
| 169 | { |
| 170 | return test_bit(BLK_MQ_S_STOPPED, &hctx->state); |
| 171 | } |
| 172 | |
Ming Lei | 19c66e5 | 2014-12-03 19:38:04 +0800 | [diff] [blame] | 173 | static inline bool blk_mq_hw_queue_mapped(struct blk_mq_hw_ctx *hctx) |
| 174 | { |
| 175 | return hctx->nr_ctx && hctx->tags; |
| 176 | } |
| 177 | |
/* In-flight helpers; the definitions live outside this header. */
unsigned int blk_mq_in_flight(struct request_queue *q,
			      struct hd_struct *part);
void blk_mq_in_flight_rw(struct request_queue *q,
			 struct hd_struct *part,
			 unsigned int inflight[2]);
Jens Axboe | f299b7c | 2017-08-08 17:51:45 -0600 | [diff] [blame] | 181 | |
Ming Lei | de14829 | 2017-10-14 17:22:29 +0800 | [diff] [blame] | 182 | static inline void blk_mq_put_dispatch_budget(struct blk_mq_hw_ctx *hctx) |
| 183 | { |
| 184 | struct request_queue *q = hctx->queue; |
| 185 | |
| 186 | if (q->mq_ops->put_budget) |
| 187 | q->mq_ops->put_budget(hctx); |
| 188 | } |
| 189 | |
Ming Lei | 88022d7 | 2017-11-05 02:21:12 +0800 | [diff] [blame] | 190 | static inline bool blk_mq_get_dispatch_budget(struct blk_mq_hw_ctx *hctx) |
Ming Lei | de14829 | 2017-10-14 17:22:29 +0800 | [diff] [blame] | 191 | { |
| 192 | struct request_queue *q = hctx->queue; |
| 193 | |
| 194 | if (q->mq_ops->get_budget) |
| 195 | return q->mq_ops->get_budget(hctx); |
Ming Lei | 88022d7 | 2017-11-05 02:21:12 +0800 | [diff] [blame] | 196 | return true; |
Ming Lei | de14829 | 2017-10-14 17:22:29 +0800 | [diff] [blame] | 197 | } |
| 198 | |
Ming Lei | 244c65a | 2017-11-04 12:39:57 -0600 | [diff] [blame] | 199 | static inline void __blk_mq_put_driver_tag(struct blk_mq_hw_ctx *hctx, |
| 200 | struct request *rq) |
| 201 | { |
John Garry | cae740a | 2020-02-26 20:10:15 +0800 | [diff] [blame] | 202 | blk_mq_put_tag(hctx->tags, rq->mq_ctx, rq->tag); |
Christoph Hellwig | 76647368 | 2020-05-29 15:53:12 +0200 | [diff] [blame] | 203 | rq->tag = BLK_MQ_NO_TAG; |
Ming Lei | 244c65a | 2017-11-04 12:39:57 -0600 | [diff] [blame] | 204 | |
| 205 | if (rq->rq_flags & RQF_MQ_INFLIGHT) { |
| 206 | rq->rq_flags &= ~RQF_MQ_INFLIGHT; |
| 207 | atomic_dec(&hctx->nr_active); |
| 208 | } |
| 209 | } |
| 210 | |
Ming Lei | 244c65a | 2017-11-04 12:39:57 -0600 | [diff] [blame] | 211 | static inline void blk_mq_put_driver_tag(struct request *rq) |
| 212 | { |
Christoph Hellwig | 76647368 | 2020-05-29 15:53:12 +0200 | [diff] [blame] | 213 | if (rq->tag == BLK_MQ_NO_TAG || rq->internal_tag == BLK_MQ_NO_TAG) |
Ming Lei | 244c65a | 2017-11-04 12:39:57 -0600 | [diff] [blame] | 214 | return; |
| 215 | |
Jens Axboe | ea4f995 | 2018-10-29 15:06:13 -0600 | [diff] [blame] | 216 | __blk_mq_put_driver_tag(rq->mq_hctx, rq); |
Ming Lei | 244c65a | 2017-11-04 12:39:57 -0600 | [diff] [blame] | 217 | } |
| 218 | |
Jens Axboe | ed76e32 | 2018-10-29 13:06:14 -0600 | [diff] [blame] | 219 | static inline void blk_mq_clear_mq_map(struct blk_mq_queue_map *qmap) |
Minwoo Im | 0da73d0 | 2018-07-02 23:46:43 +0900 | [diff] [blame] | 220 | { |
| 221 | int cpu; |
| 222 | |
| 223 | for_each_possible_cpu(cpu) |
Jens Axboe | ed76e32 | 2018-10-29 13:06:14 -0600 | [diff] [blame] | 224 | qmap->mq_map[cpu] = 0; |
Minwoo Im | 0da73d0 | 2018-07-02 23:46:43 +0900 | [diff] [blame] | 225 | } |
| 226 | |
Damien Le Moal | b49773e7 | 2019-07-11 01:18:31 +0900 | [diff] [blame] | 227 | /* |
| 228 | * blk_mq_plug() - Get caller context plug |
| 229 | * @q: request queue |
| 230 | * @bio : the bio being submitted by the caller context |
| 231 | * |
| 232 | * Plugging, by design, may delay the insertion of BIOs into the elevator in |
| 233 | * order to increase BIO merging opportunities. This however can cause BIO |
| 234 | * insertion order to change from the order in which submit_bio() is being |
| 235 | * executed in the case of multiple contexts concurrently issuing BIOs to a |
| 236 | * device, even if these context are synchronized to tightly control BIO issuing |
| 237 | * order. While this is not a problem with regular block devices, this ordering |
| 238 | * change can cause write BIO failures with zoned block devices as these |
| 239 | * require sequential write patterns to zones. Prevent this from happening by |
| 240 | * ignoring the plug state of a BIO issuing context if the target request queue |
| 241 | * is for a zoned block device and the BIO to plug is a write operation. |
| 242 | * |
| 243 | * Return current->plug if the bio can be plugged and NULL otherwise |
| 244 | */ |
| 245 | static inline struct blk_plug *blk_mq_plug(struct request_queue *q, |
| 246 | struct bio *bio) |
| 247 | { |
| 248 | /* |
| 249 | * For regular block devices or read operations, use the context plug |
| 250 | * which may be NULL if blk_start_plug() was not executed. |
| 251 | */ |
| 252 | if (!blk_queue_is_zoned(q) || !op_is_write(bio_op(bio))) |
| 253 | return current->plug; |
| 254 | |
| 255 | /* Zoned block device write operation case: do not plug the BIO */ |
| 256 | return NULL; |
| 257 | } |
| 258 | |
Jens Axboe | 320ae51 | 2013-10-24 09:20:05 +0100 | [diff] [blame] | 259 | #endif |