blob: 1f8f98efd97a03ad840f6b58cf33f587b9181179 [file] [log] [blame]
/*
 * Copyright (C) 2012 Red Hat, Inc.
 *
 * This file is released under the GPL.
 */
6
7#include "dm.h"
Joe Thornber742c8fd2016-10-21 10:06:40 -04008#include "dm-bio-prison-v1.h"
9#include "dm-bio-prison-v2.h"
Mike Snitzer4f81a412012-10-12 21:02:13 +010010
11#include <linux/spinlock.h>
12#include <linux/mempool.h>
13#include <linux/module.h>
14#include <linux/slab.h>
15
16/*----------------------------------------------------------------*/
17
Joe Thornbera195db22014-10-06 16:30:06 -040018#define MIN_CELLS 1024
Heinz Mauelshagenadcc4442014-06-05 15:23:09 +010019
20struct dm_bio_prison {
Joe Thornbera195db22014-10-06 16:30:06 -040021 spinlock_t lock;
Joe Thornbera195db22014-10-06 16:30:06 -040022 struct rb_root cells;
Mike Snitzer72d711c2018-05-22 18:26:20 -040023 mempool_t cell_pool;
Mike Snitzer4f81a412012-10-12 21:02:13 +010024};
25
Mike Snitzer4f81a412012-10-12 21:02:13 +010026static struct kmem_cache *_cell_cache;
27
Joe Thornbera195db22014-10-06 16:30:06 -040028/*----------------------------------------------------------------*/
Heinz Mauelshagenadcc4442014-06-05 15:23:09 +010029
Mike Snitzer4f81a412012-10-12 21:02:13 +010030/*
31 * @nr_cells should be the number of cells you want in use _concurrently_.
32 * Don't confuse it with the number of distinct keys.
33 */
Joe Thornbera195db22014-10-06 16:30:06 -040034struct dm_bio_prison *dm_bio_prison_create(void)
Mike Snitzer4f81a412012-10-12 21:02:13 +010035{
Kent Overstreetd3775352018-06-05 05:26:33 -040036 struct dm_bio_prison *prison = kzalloc(sizeof(*prison), GFP_KERNEL);
Kent Overstreet6f1c8192018-05-20 18:25:53 -040037 int ret;
Mike Snitzer4f81a412012-10-12 21:02:13 +010038
39 if (!prison)
40 return NULL;
41
Joe Thornbera195db22014-10-06 16:30:06 -040042 spin_lock_init(&prison->lock);
43
Kent Overstreet6f1c8192018-05-20 18:25:53 -040044 ret = mempool_init_slab_pool(&prison->cell_pool, MIN_CELLS, _cell_cache);
45 if (ret) {
Mike Snitzer4f81a412012-10-12 21:02:13 +010046 kfree(prison);
47 return NULL;
48 }
49
Joe Thornbera195db22014-10-06 16:30:06 -040050 prison->cells = RB_ROOT;
Mike Snitzer4f81a412012-10-12 21:02:13 +010051
52 return prison;
53}
54EXPORT_SYMBOL_GPL(dm_bio_prison_create);
55
56void dm_bio_prison_destroy(struct dm_bio_prison *prison)
57{
Kent Overstreet6f1c8192018-05-20 18:25:53 -040058 mempool_exit(&prison->cell_pool);
Mike Snitzer4f81a412012-10-12 21:02:13 +010059 kfree(prison);
60}
61EXPORT_SYMBOL_GPL(dm_bio_prison_destroy);
62
Joe Thornber6beca5e2013-03-01 22:45:50 +000063struct dm_bio_prison_cell *dm_bio_prison_alloc_cell(struct dm_bio_prison *prison, gfp_t gfp)
64{
Kent Overstreet6f1c8192018-05-20 18:25:53 -040065 return mempool_alloc(&prison->cell_pool, gfp);
Joe Thornber6beca5e2013-03-01 22:45:50 +000066}
67EXPORT_SYMBOL_GPL(dm_bio_prison_alloc_cell);
68
69void dm_bio_prison_free_cell(struct dm_bio_prison *prison,
70 struct dm_bio_prison_cell *cell)
71{
Kent Overstreet6f1c8192018-05-20 18:25:53 -040072 mempool_free(cell, &prison->cell_pool);
Joe Thornber6beca5e2013-03-01 22:45:50 +000073}
74EXPORT_SYMBOL_GPL(dm_bio_prison_free_cell);
75
Joe Thornbera195db22014-10-06 16:30:06 -040076static void __setup_new_cell(struct dm_cell_key *key,
Joe Thornber6beca5e2013-03-01 22:45:50 +000077 struct bio *holder,
Joe Thornber6beca5e2013-03-01 22:45:50 +000078 struct dm_bio_prison_cell *cell)
Mike Snitzer4f81a412012-10-12 21:02:13 +010079{
Joe Thornbera195db22014-10-06 16:30:06 -040080 memcpy(&cell->key, key, sizeof(cell->key));
81 cell->holder = holder;
82 bio_list_init(&cell->bios);
Joe Thornber6beca5e2013-03-01 22:45:50 +000083}
Mike Snitzer4f81a412012-10-12 21:02:13 +010084
Joe Thornbera195db22014-10-06 16:30:06 -040085static int cmp_keys(struct dm_cell_key *lhs,
86 struct dm_cell_key *rhs)
87{
88 if (lhs->virtual < rhs->virtual)
89 return -1;
90
91 if (lhs->virtual > rhs->virtual)
92 return 1;
93
94 if (lhs->dev < rhs->dev)
95 return -1;
96
97 if (lhs->dev > rhs->dev)
98 return 1;
99
Joe Thornber5f274d82014-09-17 10:17:39 +0100100 if (lhs->block_end <= rhs->block_begin)
Joe Thornbera195db22014-10-06 16:30:06 -0400101 return -1;
102
Joe Thornber5f274d82014-09-17 10:17:39 +0100103 if (lhs->block_begin >= rhs->block_end)
Joe Thornbera195db22014-10-06 16:30:06 -0400104 return 1;
105
106 return 0;
107}
108
109static int __bio_detain(struct dm_bio_prison *prison,
Joe Thornber6beca5e2013-03-01 22:45:50 +0000110 struct dm_cell_key *key,
111 struct bio *inmate,
112 struct dm_bio_prison_cell *cell_prealloc,
113 struct dm_bio_prison_cell **cell_result)
114{
Joe Thornbera195db22014-10-06 16:30:06 -0400115 int r;
116 struct rb_node **new = &prison->cells.rb_node, *parent = NULL;
Mike Snitzer4f81a412012-10-12 21:02:13 +0100117
Joe Thornbera195db22014-10-06 16:30:06 -0400118 while (*new) {
119 struct dm_bio_prison_cell *cell =
Geliang Tang6e333d02017-05-06 23:39:10 +0800120 rb_entry(*new, struct dm_bio_prison_cell, node);
Joe Thornbera195db22014-10-06 16:30:06 -0400121
122 r = cmp_keys(key, &cell->key);
123
124 parent = *new;
125 if (r < 0)
126 new = &((*new)->rb_left);
127 else if (r > 0)
128 new = &((*new)->rb_right);
129 else {
130 if (inmate)
131 bio_list_add(&cell->bios, inmate);
132 *cell_result = cell;
133 return 1;
134 }
Joe Thornber6beca5e2013-03-01 22:45:50 +0000135 }
136
Joe Thornbera195db22014-10-06 16:30:06 -0400137 __setup_new_cell(key, inmate, cell_prealloc);
Joe Thornber6beca5e2013-03-01 22:45:50 +0000138 *cell_result = cell_prealloc;
Joe Thornbera195db22014-10-06 16:30:06 -0400139
140 rb_link_node(&cell_prealloc->node, parent, new);
141 rb_insert_color(&cell_prealloc->node, &prison->cells);
142
Joe Thornber6beca5e2013-03-01 22:45:50 +0000143 return 0;
144}
145
146static int bio_detain(struct dm_bio_prison *prison,
147 struct dm_cell_key *key,
148 struct bio *inmate,
149 struct dm_bio_prison_cell *cell_prealloc,
150 struct dm_bio_prison_cell **cell_result)
151{
152 int r;
Joe Thornber6beca5e2013-03-01 22:45:50 +0000153
Mikulas Patocka235bc862019-10-15 08:16:51 -0400154 spin_lock_irq(&prison->lock);
Joe Thornbera195db22014-10-06 16:30:06 -0400155 r = __bio_detain(prison, key, inmate, cell_prealloc, cell_result);
Mikulas Patocka235bc862019-10-15 08:16:51 -0400156 spin_unlock_irq(&prison->lock);
Mike Snitzer4f81a412012-10-12 21:02:13 +0100157
Mike Snitzer4f81a412012-10-12 21:02:13 +0100158 return r;
159}
Joe Thornber6beca5e2013-03-01 22:45:50 +0000160
/*
 * Detain @inmate in the cell matching @key.
 *
 * Returns 1 if such a cell already existed (@inmate, when non-NULL, is
 * queued on it), or 0 if @cell_prealloc was inserted with @inmate as its
 * holder.  In both cases *@cell_result is set to the cell in the tree.
 */
int dm_bio_detain(struct dm_bio_prison *prison,
		  struct dm_cell_key *key,
		  struct bio *inmate,
		  struct dm_bio_prison_cell *cell_prealloc,
		  struct dm_bio_prison_cell **cell_result)
{
	int r = bio_detain(prison, key, inmate, cell_prealloc, cell_result);

	return r;
}
EXPORT_SYMBOL_GPL(dm_bio_detain);
170
Joe Thornberc6b4fcb2013-03-01 22:45:51 +0000171int dm_get_cell(struct dm_bio_prison *prison,
172 struct dm_cell_key *key,
173 struct dm_bio_prison_cell *cell_prealloc,
174 struct dm_bio_prison_cell **cell_result)
175{
176 return bio_detain(prison, key, NULL, cell_prealloc, cell_result);
177}
178EXPORT_SYMBOL_GPL(dm_get_cell);
179
Mike Snitzer4f81a412012-10-12 21:02:13 +0100180/*
181 * @inmates must have been initialised prior to this call
182 */
Joe Thornbera195db22014-10-06 16:30:06 -0400183static void __cell_release(struct dm_bio_prison *prison,
184 struct dm_bio_prison_cell *cell,
Joe Thornber6beca5e2013-03-01 22:45:50 +0000185 struct bio_list *inmates)
Mike Snitzer4f81a412012-10-12 21:02:13 +0100186{
Joe Thornbera195db22014-10-06 16:30:06 -0400187 rb_erase(&cell->node, &prison->cells);
Mike Snitzer4f81a412012-10-12 21:02:13 +0100188
189 if (inmates) {
Joe Thornber6beca5e2013-03-01 22:45:50 +0000190 if (cell->holder)
191 bio_list_add(inmates, cell->holder);
Mike Snitzer4f81a412012-10-12 21:02:13 +0100192 bio_list_merge(inmates, &cell->bios);
193 }
Mike Snitzer4f81a412012-10-12 21:02:13 +0100194}
195
Joe Thornber6beca5e2013-03-01 22:45:50 +0000196void dm_cell_release(struct dm_bio_prison *prison,
197 struct dm_bio_prison_cell *cell,
198 struct bio_list *bios)
Mike Snitzer4f81a412012-10-12 21:02:13 +0100199{
Mikulas Patocka235bc862019-10-15 08:16:51 -0400200 spin_lock_irq(&prison->lock);
Joe Thornbera195db22014-10-06 16:30:06 -0400201 __cell_release(prison, cell, bios);
Mikulas Patocka235bc862019-10-15 08:16:51 -0400202 spin_unlock_irq(&prison->lock);
Mike Snitzer4f81a412012-10-12 21:02:13 +0100203}
204EXPORT_SYMBOL_GPL(dm_cell_release);
205
206/*
Mike Snitzer4f81a412012-10-12 21:02:13 +0100207 * Sometimes we don't want the holder, just the additional bios.
208 */
Joe Thornbera195db22014-10-06 16:30:06 -0400209static void __cell_release_no_holder(struct dm_bio_prison *prison,
210 struct dm_bio_prison_cell *cell,
Joe Thornber6beca5e2013-03-01 22:45:50 +0000211 struct bio_list *inmates)
Mike Snitzer4f81a412012-10-12 21:02:13 +0100212{
Joe Thornbera195db22014-10-06 16:30:06 -0400213 rb_erase(&cell->node, &prison->cells);
Mike Snitzer4f81a412012-10-12 21:02:13 +0100214 bio_list_merge(inmates, &cell->bios);
Mike Snitzer4f81a412012-10-12 21:02:13 +0100215}
216
Joe Thornber6beca5e2013-03-01 22:45:50 +0000217void dm_cell_release_no_holder(struct dm_bio_prison *prison,
218 struct dm_bio_prison_cell *cell,
219 struct bio_list *inmates)
Mike Snitzer4f81a412012-10-12 21:02:13 +0100220{
221 unsigned long flags;
Mike Snitzer4f81a412012-10-12 21:02:13 +0100222
Joe Thornbera195db22014-10-06 16:30:06 -0400223 spin_lock_irqsave(&prison->lock, flags);
224 __cell_release_no_holder(prison, cell, inmates);
225 spin_unlock_irqrestore(&prison->lock, flags);
Mike Snitzer4f81a412012-10-12 21:02:13 +0100226}
227EXPORT_SYMBOL_GPL(dm_cell_release_no_holder);
228
Joe Thornber6beca5e2013-03-01 22:45:50 +0000229void dm_cell_error(struct dm_bio_prison *prison,
Christoph Hellwig4e4cbee2017-06-03 09:38:06 +0200230 struct dm_bio_prison_cell *cell, blk_status_t error)
Mike Snitzer4f81a412012-10-12 21:02:13 +0100231{
Mike Snitzer4f81a412012-10-12 21:02:13 +0100232 struct bio_list bios;
233 struct bio *bio;
Mike Snitzer4f81a412012-10-12 21:02:13 +0100234
235 bio_list_init(&bios);
Heinz Mauelshagenadcc4442014-06-05 15:23:09 +0100236 dm_cell_release(prison, cell, &bios);
Mike Snitzer4f81a412012-10-12 21:02:13 +0100237
Christoph Hellwig4246a0b2015-07-20 15:29:37 +0200238 while ((bio = bio_list_pop(&bios))) {
Christoph Hellwig4e4cbee2017-06-03 09:38:06 +0200239 bio->bi_status = error;
Christoph Hellwig4246a0b2015-07-20 15:29:37 +0200240 bio_endio(bio);
241 }
Mike Snitzer4f81a412012-10-12 21:02:13 +0100242}
243EXPORT_SYMBOL_GPL(dm_cell_error);
244
Joe Thornber2d759a42014-10-10 15:27:16 +0100245void dm_cell_visit_release(struct dm_bio_prison *prison,
246 void (*visit_fn)(void *, struct dm_bio_prison_cell *),
247 void *context,
248 struct dm_bio_prison_cell *cell)
249{
Mikulas Patocka235bc862019-10-15 08:16:51 -0400250 spin_lock_irq(&prison->lock);
Joe Thornber2d759a42014-10-10 15:27:16 +0100251 visit_fn(context, cell);
252 rb_erase(&cell->node, &prison->cells);
Mikulas Patocka235bc862019-10-15 08:16:51 -0400253 spin_unlock_irq(&prison->lock);
Joe Thornber2d759a42014-10-10 15:27:16 +0100254}
255EXPORT_SYMBOL_GPL(dm_cell_visit_release);
256
Joe Thornber3cdf93f2015-05-15 15:23:35 +0100257static int __promote_or_release(struct dm_bio_prison *prison,
258 struct dm_bio_prison_cell *cell)
259{
260 if (bio_list_empty(&cell->bios)) {
261 rb_erase(&cell->node, &prison->cells);
262 return 1;
263 }
264
265 cell->holder = bio_list_pop(&cell->bios);
266 return 0;
267}
268
269int dm_cell_promote_or_release(struct dm_bio_prison *prison,
270 struct dm_bio_prison_cell *cell)
271{
272 int r;
Joe Thornber3cdf93f2015-05-15 15:23:35 +0100273
Mikulas Patocka235bc862019-10-15 08:16:51 -0400274 spin_lock_irq(&prison->lock);
Joe Thornber3cdf93f2015-05-15 15:23:35 +0100275 r = __promote_or_release(prison, cell);
Mikulas Patocka235bc862019-10-15 08:16:51 -0400276 spin_unlock_irq(&prison->lock);
Joe Thornber3cdf93f2015-05-15 15:23:35 +0100277
278 return r;
279}
280EXPORT_SYMBOL_GPL(dm_cell_promote_or_release);
281
Mike Snitzer4f81a412012-10-12 21:02:13 +0100282/*----------------------------------------------------------------*/
283
284#define DEFERRED_SET_SIZE 64
285
286struct dm_deferred_entry {
287 struct dm_deferred_set *ds;
288 unsigned count;
289 struct list_head work_items;
290};
291
292struct dm_deferred_set {
293 spinlock_t lock;
294 unsigned current_entry;
295 unsigned sweeper;
296 struct dm_deferred_entry entries[DEFERRED_SET_SIZE];
297};
298
299struct dm_deferred_set *dm_deferred_set_create(void)
300{
301 int i;
302 struct dm_deferred_set *ds;
303
304 ds = kmalloc(sizeof(*ds), GFP_KERNEL);
305 if (!ds)
306 return NULL;
307
308 spin_lock_init(&ds->lock);
309 ds->current_entry = 0;
310 ds->sweeper = 0;
311 for (i = 0; i < DEFERRED_SET_SIZE; i++) {
312 ds->entries[i].ds = ds;
313 ds->entries[i].count = 0;
314 INIT_LIST_HEAD(&ds->entries[i].work_items);
315 }
316
317 return ds;
318}
319EXPORT_SYMBOL_GPL(dm_deferred_set_create);
320
/*
 * Free a deferred set.  Work items still queued on its entries are not
 * touched.
 */
void dm_deferred_set_destroy(struct dm_deferred_set *ds)
{
	kfree(ds);
}
EXPORT_SYMBOL_GPL(dm_deferred_set_destroy);
326
327struct dm_deferred_entry *dm_deferred_entry_inc(struct dm_deferred_set *ds)
328{
329 unsigned long flags;
330 struct dm_deferred_entry *entry;
331
332 spin_lock_irqsave(&ds->lock, flags);
333 entry = ds->entries + ds->current_entry;
334 entry->count++;
335 spin_unlock_irqrestore(&ds->lock, flags);
336
337 return entry;
338}
339EXPORT_SYMBOL_GPL(dm_deferred_entry_inc);
340
341static unsigned ds_next(unsigned index)
342{
343 return (index + 1) % DEFERRED_SET_SIZE;
344}
345
346static void __sweep(struct dm_deferred_set *ds, struct list_head *head)
347{
348 while ((ds->sweeper != ds->current_entry) &&
349 !ds->entries[ds->sweeper].count) {
350 list_splice_init(&ds->entries[ds->sweeper].work_items, head);
351 ds->sweeper = ds_next(ds->sweeper);
352 }
353
354 if ((ds->sweeper == ds->current_entry) && !ds->entries[ds->sweeper].count)
355 list_splice_init(&ds->entries[ds->sweeper].work_items, head);
356}
357
358void dm_deferred_entry_dec(struct dm_deferred_entry *entry, struct list_head *head)
359{
360 unsigned long flags;
361
362 spin_lock_irqsave(&entry->ds->lock, flags);
363 BUG_ON(!entry->count);
364 --entry->count;
365 __sweep(entry->ds, head);
366 spin_unlock_irqrestore(&entry->ds->lock, flags);
367}
368EXPORT_SYMBOL_GPL(dm_deferred_entry_dec);
369
370/*
371 * Returns 1 if deferred or 0 if no pending items to delay job.
372 */
373int dm_deferred_set_add_work(struct dm_deferred_set *ds, struct list_head *work)
374{
375 int r = 1;
Mike Snitzer4f81a412012-10-12 21:02:13 +0100376 unsigned next_entry;
377
Mikulas Patocka235bc862019-10-15 08:16:51 -0400378 spin_lock_irq(&ds->lock);
Mike Snitzer4f81a412012-10-12 21:02:13 +0100379 if ((ds->sweeper == ds->current_entry) &&
380 !ds->entries[ds->current_entry].count)
381 r = 0;
382 else {
383 list_add(work, &ds->entries[ds->current_entry].work_items);
384 next_entry = ds_next(ds->current_entry);
385 if (!ds->entries[next_entry].count)
386 ds->current_entry = next_entry;
387 }
Mikulas Patocka235bc862019-10-15 08:16:51 -0400388 spin_unlock_irq(&ds->lock);
Mike Snitzer4f81a412012-10-12 21:02:13 +0100389
390 return r;
391}
392EXPORT_SYMBOL_GPL(dm_deferred_set_add_work);
393
394/*----------------------------------------------------------------*/
395
Joe Thornber742c8fd2016-10-21 10:06:40 -0400396static int __init dm_bio_prison_init_v1(void)
Mike Snitzer4f81a412012-10-12 21:02:13 +0100397{
398 _cell_cache = KMEM_CACHE(dm_bio_prison_cell, 0);
399 if (!_cell_cache)
400 return -ENOMEM;
401
402 return 0;
403}
404
Joe Thornber742c8fd2016-10-21 10:06:40 -0400405static void dm_bio_prison_exit_v1(void)
Mike Snitzer4f81a412012-10-12 21:02:13 +0100406{
407 kmem_cache_destroy(_cell_cache);
408 _cell_cache = NULL;
409}
410
Joe Thornber742c8fd2016-10-21 10:06:40 -0400411static int (*_inits[])(void) __initdata = {
412 dm_bio_prison_init_v1,
413 dm_bio_prison_init_v2,
414};
415
416static void (*_exits[])(void) = {
417 dm_bio_prison_exit_v1,
418 dm_bio_prison_exit_v2,
419};
420
421static int __init dm_bio_prison_init(void)
422{
423 const int count = ARRAY_SIZE(_inits);
424
425 int r, i;
426
427 for (i = 0; i < count; i++) {
428 r = _inits[i]();
429 if (r)
430 goto bad;
431 }
432
433 return 0;
434
435 bad:
436 while (i--)
437 _exits[i]();
438
439 return r;
440}
441
442static void __exit dm_bio_prison_exit(void)
443{
444 int i = ARRAY_SIZE(_exits);
445
446 while (i--)
447 _exits[i]();
448}
449
Mike Snitzer4f81a412012-10-12 21:02:13 +0100450/*
451 * module hooks
452 */
453module_init(dm_bio_prison_init);
454module_exit(dm_bio_prison_exit);
455
456MODULE_DESCRIPTION(DM_NAME " bio prison");
457MODULE_AUTHOR("Joe Thornber <dm-devel@redhat.com>");
458MODULE_LICENSE("GPL");