David Sterba | c1d7c51 | 2018-04-03 19:23:33 +0200 | [diff] [blame] | 1 | // SPDX-License-Identifier: GPL-2.0 |
Chris Mason | 8b71284 | 2008-06-11 16:50:36 -0400 | [diff] [blame] | 2 | /* |
| 3 | * Copyright (C) 2007 Oracle. All rights reserved. |
Qu Wenruo | 08a9ff3 | 2014-02-28 10:46:03 +0800 | [diff] [blame] | 4 | * Copyright (C) 2014 Fujitsu. All rights reserved. |
Chris Mason | 8b71284 | 2008-06-11 16:50:36 -0400 | [diff] [blame] | 5 | */ |
| 6 | |
| 7 | #include <linux/kthread.h> |
Tejun Heo | 5a0e3ad | 2010-03-24 17:04:11 +0900 | [diff] [blame] | 8 | #include <linux/slab.h> |
Chris Mason | 8b71284 | 2008-06-11 16:50:36 -0400 | [diff] [blame] | 9 | #include <linux/list.h> |
| 10 | #include <linux/spinlock.h> |
Chris Mason | b51912c | 2009-02-04 09:23:24 -0500 | [diff] [blame] | 11 | #include <linux/freezer.h> |
Chris Mason | 8b71284 | 2008-06-11 16:50:36 -0400 | [diff] [blame] | 12 | #include "async-thread.h" |
Qu Wenruo | 52483bc | 2014-03-06 04:19:50 +0000 | [diff] [blame] | 13 | #include "ctree.h" |
Chris Mason | 8b71284 | 2008-06-11 16:50:36 -0400 | [diff] [blame] | 14 | |
/* Bit numbers stored in btrfs_work::flags and accessed with the bitops. */
enum {
	/* Set by the worker after work->func() has returned. */
	WORK_DONE_BIT = 0,
	/* Set by the thread that claims the item to run its ordered_func(). */
	WORK_ORDER_DONE_BIT = 1,
	/* Ask btrfs_queue_work() to use the high priority queue, if any. */
	WORK_HIGH_PRIO_BIT = 2,
};
Chris Mason | 4a69a41 | 2008-11-06 22:03:00 -0500 | [diff] [blame] | 20 | |
/* Value of __btrfs_workqueue::thresh meaning "thresholding is disabled". */
#define NO_THRESHOLD (-1)
/* Threshold used when the caller passes 0; smaller requests disable it. */
#define DFT_THRESHOLD (32)
| 23 | |
Qu Wenruo | d458b05 | 2014-02-28 10:46:19 +0800 | [diff] [blame] | 24 | struct __btrfs_workqueue { |
Qu Wenruo | 08a9ff3 | 2014-02-28 10:46:03 +0800 | [diff] [blame] | 25 | struct workqueue_struct *normal_wq; |
Jeff Mahoney | cb00109 | 2016-06-09 16:22:11 -0400 | [diff] [blame] | 26 | |
| 27 | /* File system this workqueue services */ |
| 28 | struct btrfs_fs_info *fs_info; |
| 29 | |
Qu Wenruo | 08a9ff3 | 2014-02-28 10:46:03 +0800 | [diff] [blame] | 30 | /* List head pointing to ordered work list */ |
| 31 | struct list_head ordered_list; |
| 32 | |
| 33 | /* Spinlock for ordered_list */ |
| 34 | spinlock_t list_lock; |
Qu Wenruo | 0bd9289 | 2014-02-28 10:46:05 +0800 | [diff] [blame] | 35 | |
| 36 | /* Thresholding related variants */ |
| 37 | atomic_t pending; |
Qu Wenruo | c6dd6ea | 2015-08-20 09:30:39 +0800 | [diff] [blame] | 38 | |
| 39 | /* Up limit of concurrency workers */ |
| 40 | int limit_active; |
| 41 | |
| 42 | /* Current number of concurrency workers */ |
| 43 | int current_active; |
| 44 | |
| 45 | /* Threshold to change current_active */ |
Qu Wenruo | 0bd9289 | 2014-02-28 10:46:05 +0800 | [diff] [blame] | 46 | int thresh; |
| 47 | unsigned int count; |
| 48 | spinlock_t thres_lock; |
Qu Wenruo | 08a9ff3 | 2014-02-28 10:46:03 +0800 | [diff] [blame] | 49 | }; |
| 50 | |
/*
 * Workqueue handle given to callers: a mandatory normal priority queue and
 * an optional high priority one.
 */
struct btrfs_workqueue {
	/* Always allocated by btrfs_alloc_workqueue() */
	struct __btrfs_workqueue *normal;
	/* Only allocated when WQ_HIGHPRI was requested, NULL otherwise */
	struct __btrfs_workqueue *high;
};
| 55 | |
static void normal_work_helper(struct btrfs_work *work);

/*
 * Define btrfs_<name>(), a work_struct callback that recovers the btrfs_work
 * embedding @arg (through its normal_work member) and passes it on to
 * normal_work_helper().
 */
#define BTRFS_WORK_HELPER(name)						\
noinline_for_stack void btrfs_##name(struct work_struct *arg)		\
{									\
	normal_work_helper(container_of(arg, struct btrfs_work,	\
					normal_work));			\
}
| 65 | |
Jeff Mahoney | cb00109 | 2016-06-09 16:22:11 -0400 | [diff] [blame] | 66 | struct btrfs_fs_info * |
Jeff Mahoney | 9a35b63 | 2017-06-28 21:56:54 -0600 | [diff] [blame] | 67 | btrfs_workqueue_owner(const struct __btrfs_workqueue *wq) |
Jeff Mahoney | cb00109 | 2016-06-09 16:22:11 -0400 | [diff] [blame] | 68 | { |
| 69 | return wq->fs_info; |
| 70 | } |
| 71 | |
| 72 | struct btrfs_fs_info * |
Jeff Mahoney | 9a35b63 | 2017-06-28 21:56:54 -0600 | [diff] [blame] | 73 | btrfs_work_owner(const struct btrfs_work *work) |
Jeff Mahoney | cb00109 | 2016-06-09 16:22:11 -0400 | [diff] [blame] | 74 | { |
| 75 | return work->wq->fs_info; |
| 76 | } |
| 77 | |
Jeff Mahoney | 9a35b63 | 2017-06-28 21:56:54 -0600 | [diff] [blame] | 78 | bool btrfs_workqueue_normal_congested(const struct btrfs_workqueue *wq) |
Maxim Patlasov | 2939e1a | 2016-12-12 14:32:44 -0800 | [diff] [blame] | 79 | { |
| 80 | /* |
| 81 | * We could compare wq->normal->pending with num_online_cpus() |
| 82 | * to support "thresh == NO_THRESHOLD" case, but it requires |
| 83 | * moving up atomic_inc/dec in thresh_queue/exec_hook. Let's |
| 84 | * postpone it until someone needs the support of that case. |
| 85 | */ |
| 86 | if (wq->normal->thresh == NO_THRESHOLD) |
| 87 | return false; |
| 88 | |
| 89 | return atomic_read(&wq->normal->pending) > wq->normal->thresh * 2; |
| 90 | } |
| 91 | |
/*
 * Instantiate one btrfs_<name>() work function per kind of work. All of
 * them do the same thing; they only differ in name (and therefore address).
 */
BTRFS_WORK_HELPER(worker_helper);
BTRFS_WORK_HELPER(delalloc_helper);
BTRFS_WORK_HELPER(flush_delalloc_helper);
BTRFS_WORK_HELPER(cache_helper);
BTRFS_WORK_HELPER(submit_helper);
BTRFS_WORK_HELPER(fixup_helper);
BTRFS_WORK_HELPER(endio_helper);
BTRFS_WORK_HELPER(endio_meta_helper);
BTRFS_WORK_HELPER(endio_meta_write_helper);
BTRFS_WORK_HELPER(endio_raid56_helper);
BTRFS_WORK_HELPER(endio_repair_helper);
BTRFS_WORK_HELPER(rmw_helper);
BTRFS_WORK_HELPER(endio_write_helper);
BTRFS_WORK_HELPER(freespace_write_helper);
BTRFS_WORK_HELPER(delayed_meta_helper);
BTRFS_WORK_HELPER(readahead_helper);
BTRFS_WORK_HELPER(qgroup_rescan_helper);
BTRFS_WORK_HELPER(extent_refs_helper);
BTRFS_WORK_HELPER(scrub_helper);
BTRFS_WORK_HELPER(scrubwrc_helper);
BTRFS_WORK_HELPER(scrubnc_helper);
BTRFS_WORK_HELPER(scrubparity_helper);
Liu Bo | 9e0af23 | 2014-08-15 23:36:53 +0800 | [diff] [blame] | 114 | |
| 115 | static struct __btrfs_workqueue * |
Jeff Mahoney | cb00109 | 2016-06-09 16:22:11 -0400 | [diff] [blame] | 116 | __btrfs_alloc_workqueue(struct btrfs_fs_info *fs_info, const char *name, |
| 117 | unsigned int flags, int limit_active, int thresh) |
Qu Wenruo | 08a9ff3 | 2014-02-28 10:46:03 +0800 | [diff] [blame] | 118 | { |
David Sterba | 61dd5ae | 2015-12-01 18:04:30 +0100 | [diff] [blame] | 119 | struct __btrfs_workqueue *ret = kzalloc(sizeof(*ret), GFP_KERNEL); |
Qu Wenruo | 08a9ff3 | 2014-02-28 10:46:03 +0800 | [diff] [blame] | 120 | |
David Sterba | 5d99a998 | 2014-09-29 19:20:37 +0200 | [diff] [blame] | 121 | if (!ret) |
Qu Wenruo | 08a9ff3 | 2014-02-28 10:46:03 +0800 | [diff] [blame] | 122 | return NULL; |
| 123 | |
Jeff Mahoney | cb00109 | 2016-06-09 16:22:11 -0400 | [diff] [blame] | 124 | ret->fs_info = fs_info; |
Qu Wenruo | c6dd6ea | 2015-08-20 09:30:39 +0800 | [diff] [blame] | 125 | ret->limit_active = limit_active; |
Qu Wenruo | 0bd9289 | 2014-02-28 10:46:05 +0800 | [diff] [blame] | 126 | atomic_set(&ret->pending, 0); |
| 127 | if (thresh == 0) |
| 128 | thresh = DFT_THRESHOLD; |
| 129 | /* For low threshold, disabling threshold is a better choice */ |
| 130 | if (thresh < DFT_THRESHOLD) { |
Qu Wenruo | c6dd6ea | 2015-08-20 09:30:39 +0800 | [diff] [blame] | 131 | ret->current_active = limit_active; |
Qu Wenruo | 0bd9289 | 2014-02-28 10:46:05 +0800 | [diff] [blame] | 132 | ret->thresh = NO_THRESHOLD; |
| 133 | } else { |
Qu Wenruo | c6dd6ea | 2015-08-20 09:30:39 +0800 | [diff] [blame] | 134 | /* |
| 135 | * For threshold-able wq, let its concurrency grow on demand. |
| 136 | * Use minimal max_active at alloc time to reduce resource |
| 137 | * usage. |
| 138 | */ |
| 139 | ret->current_active = 1; |
Qu Wenruo | 0bd9289 | 2014-02-28 10:46:05 +0800 | [diff] [blame] | 140 | ret->thresh = thresh; |
| 141 | } |
| 142 | |
Qu Wenruo | 1ca0897 | 2014-02-28 10:46:04 +0800 | [diff] [blame] | 143 | if (flags & WQ_HIGHPRI) |
David Sterba | ce3ded1 | 2019-01-17 17:15:18 +0100 | [diff] [blame] | 144 | ret->normal_wq = alloc_workqueue("btrfs-%s-high", flags, |
| 145 | ret->current_active, name); |
Qu Wenruo | 1ca0897 | 2014-02-28 10:46:04 +0800 | [diff] [blame] | 146 | else |
David Sterba | ce3ded1 | 2019-01-17 17:15:18 +0100 | [diff] [blame] | 147 | ret->normal_wq = alloc_workqueue("btrfs-%s", flags, |
| 148 | ret->current_active, name); |
David Sterba | 5d99a998 | 2014-09-29 19:20:37 +0200 | [diff] [blame] | 149 | if (!ret->normal_wq) { |
Qu Wenruo | 08a9ff3 | 2014-02-28 10:46:03 +0800 | [diff] [blame] | 150 | kfree(ret); |
| 151 | return NULL; |
| 152 | } |
| 153 | |
| 154 | INIT_LIST_HEAD(&ret->ordered_list); |
| 155 | spin_lock_init(&ret->list_lock); |
Qu Wenruo | 0bd9289 | 2014-02-28 10:46:05 +0800 | [diff] [blame] | 156 | spin_lock_init(&ret->thres_lock); |
Qu Wenruo | c3a4689 | 2014-03-12 08:05:33 +0000 | [diff] [blame] | 157 | trace_btrfs_workqueue_alloc(ret, name, flags & WQ_HIGHPRI); |
Qu Wenruo | 08a9ff3 | 2014-02-28 10:46:03 +0800 | [diff] [blame] | 158 | return ret; |
| 159 | } |
| 160 | |
Qu Wenruo | 1ca0897 | 2014-02-28 10:46:04 +0800 | [diff] [blame] | 161 | static inline void |
Qu Wenruo | d458b05 | 2014-02-28 10:46:19 +0800 | [diff] [blame] | 162 | __btrfs_destroy_workqueue(struct __btrfs_workqueue *wq); |
Qu Wenruo | 1ca0897 | 2014-02-28 10:46:04 +0800 | [diff] [blame] | 163 | |
Jeff Mahoney | cb00109 | 2016-06-09 16:22:11 -0400 | [diff] [blame] | 164 | struct btrfs_workqueue *btrfs_alloc_workqueue(struct btrfs_fs_info *fs_info, |
| 165 | const char *name, |
David Sterba | 6f01105 | 2015-02-16 18:34:01 +0100 | [diff] [blame] | 166 | unsigned int flags, |
Qu Wenruo | c6dd6ea | 2015-08-20 09:30:39 +0800 | [diff] [blame] | 167 | int limit_active, |
Qu Wenruo | d458b05 | 2014-02-28 10:46:19 +0800 | [diff] [blame] | 168 | int thresh) |
Qu Wenruo | 1ca0897 | 2014-02-28 10:46:04 +0800 | [diff] [blame] | 169 | { |
David Sterba | 61dd5ae | 2015-12-01 18:04:30 +0100 | [diff] [blame] | 170 | struct btrfs_workqueue *ret = kzalloc(sizeof(*ret), GFP_KERNEL); |
Qu Wenruo | 1ca0897 | 2014-02-28 10:46:04 +0800 | [diff] [blame] | 171 | |
David Sterba | 5d99a998 | 2014-09-29 19:20:37 +0200 | [diff] [blame] | 172 | if (!ret) |
Qu Wenruo | 1ca0897 | 2014-02-28 10:46:04 +0800 | [diff] [blame] | 173 | return NULL; |
| 174 | |
Jeff Mahoney | cb00109 | 2016-06-09 16:22:11 -0400 | [diff] [blame] | 175 | ret->normal = __btrfs_alloc_workqueue(fs_info, name, |
| 176 | flags & ~WQ_HIGHPRI, |
Qu Wenruo | c6dd6ea | 2015-08-20 09:30:39 +0800 | [diff] [blame] | 177 | limit_active, thresh); |
David Sterba | 5d99a998 | 2014-09-29 19:20:37 +0200 | [diff] [blame] | 178 | if (!ret->normal) { |
Qu Wenruo | 1ca0897 | 2014-02-28 10:46:04 +0800 | [diff] [blame] | 179 | kfree(ret); |
| 180 | return NULL; |
| 181 | } |
| 182 | |
| 183 | if (flags & WQ_HIGHPRI) { |
Jeff Mahoney | cb00109 | 2016-06-09 16:22:11 -0400 | [diff] [blame] | 184 | ret->high = __btrfs_alloc_workqueue(fs_info, name, flags, |
| 185 | limit_active, thresh); |
David Sterba | 5d99a998 | 2014-09-29 19:20:37 +0200 | [diff] [blame] | 186 | if (!ret->high) { |
Qu Wenruo | 1ca0897 | 2014-02-28 10:46:04 +0800 | [diff] [blame] | 187 | __btrfs_destroy_workqueue(ret->normal); |
| 188 | kfree(ret); |
| 189 | return NULL; |
| 190 | } |
| 191 | } |
| 192 | return ret; |
| 193 | } |
| 194 | |
Qu Wenruo | 0bd9289 | 2014-02-28 10:46:05 +0800 | [diff] [blame] | 195 | /* |
| 196 | * Hook for threshold which will be called in btrfs_queue_work. |
| 197 | * This hook WILL be called in IRQ handler context, |
| 198 | * so workqueue_set_max_active MUST NOT be called in this hook |
| 199 | */ |
Qu Wenruo | d458b05 | 2014-02-28 10:46:19 +0800 | [diff] [blame] | 200 | static inline void thresh_queue_hook(struct __btrfs_workqueue *wq) |
Qu Wenruo | 0bd9289 | 2014-02-28 10:46:05 +0800 | [diff] [blame] | 201 | { |
| 202 | if (wq->thresh == NO_THRESHOLD) |
| 203 | return; |
| 204 | atomic_inc(&wq->pending); |
| 205 | } |
| 206 | |
| 207 | /* |
| 208 | * Hook for threshold which will be called before executing the work, |
| 209 | * This hook is called in kthread content. |
| 210 | * So workqueue_set_max_active is called here. |
| 211 | */ |
Qu Wenruo | d458b05 | 2014-02-28 10:46:19 +0800 | [diff] [blame] | 212 | static inline void thresh_exec_hook(struct __btrfs_workqueue *wq) |
Qu Wenruo | 0bd9289 | 2014-02-28 10:46:05 +0800 | [diff] [blame] | 213 | { |
Qu Wenruo | c6dd6ea | 2015-08-20 09:30:39 +0800 | [diff] [blame] | 214 | int new_current_active; |
Qu Wenruo | 0bd9289 | 2014-02-28 10:46:05 +0800 | [diff] [blame] | 215 | long pending; |
| 216 | int need_change = 0; |
| 217 | |
| 218 | if (wq->thresh == NO_THRESHOLD) |
| 219 | return; |
| 220 | |
| 221 | atomic_dec(&wq->pending); |
| 222 | spin_lock(&wq->thres_lock); |
| 223 | /* |
| 224 | * Use wq->count to limit the calling frequency of |
| 225 | * workqueue_set_max_active. |
| 226 | */ |
| 227 | wq->count++; |
| 228 | wq->count %= (wq->thresh / 4); |
| 229 | if (!wq->count) |
| 230 | goto out; |
Qu Wenruo | c6dd6ea | 2015-08-20 09:30:39 +0800 | [diff] [blame] | 231 | new_current_active = wq->current_active; |
Qu Wenruo | 0bd9289 | 2014-02-28 10:46:05 +0800 | [diff] [blame] | 232 | |
| 233 | /* |
| 234 | * pending may be changed later, but it's OK since we really |
| 235 | * don't need it so accurate to calculate new_max_active. |
| 236 | */ |
| 237 | pending = atomic_read(&wq->pending); |
| 238 | if (pending > wq->thresh) |
Qu Wenruo | c6dd6ea | 2015-08-20 09:30:39 +0800 | [diff] [blame] | 239 | new_current_active++; |
Qu Wenruo | 0bd9289 | 2014-02-28 10:46:05 +0800 | [diff] [blame] | 240 | if (pending < wq->thresh / 2) |
Qu Wenruo | c6dd6ea | 2015-08-20 09:30:39 +0800 | [diff] [blame] | 241 | new_current_active--; |
| 242 | new_current_active = clamp_val(new_current_active, 1, wq->limit_active); |
| 243 | if (new_current_active != wq->current_active) { |
Qu Wenruo | 0bd9289 | 2014-02-28 10:46:05 +0800 | [diff] [blame] | 244 | need_change = 1; |
Qu Wenruo | c6dd6ea | 2015-08-20 09:30:39 +0800 | [diff] [blame] | 245 | wq->current_active = new_current_active; |
Qu Wenruo | 0bd9289 | 2014-02-28 10:46:05 +0800 | [diff] [blame] | 246 | } |
| 247 | out: |
| 248 | spin_unlock(&wq->thres_lock); |
| 249 | |
| 250 | if (need_change) { |
Qu Wenruo | c6dd6ea | 2015-08-20 09:30:39 +0800 | [diff] [blame] | 251 | workqueue_set_max_active(wq->normal_wq, wq->current_active); |
Qu Wenruo | 0bd9289 | 2014-02-28 10:46:05 +0800 | [diff] [blame] | 252 | } |
| 253 | } |
| 254 | |
Omar Sandoval | c495dcd | 2019-09-16 11:30:53 -0700 | [diff] [blame^] | 255 | static void run_ordered_work(struct __btrfs_workqueue *wq, |
| 256 | struct btrfs_work *self) |
Qu Wenruo | 08a9ff3 | 2014-02-28 10:46:03 +0800 | [diff] [blame] | 257 | { |
| 258 | struct list_head *list = &wq->ordered_list; |
Qu Wenruo | d458b05 | 2014-02-28 10:46:19 +0800 | [diff] [blame] | 259 | struct btrfs_work *work; |
Qu Wenruo | 08a9ff3 | 2014-02-28 10:46:03 +0800 | [diff] [blame] | 260 | spinlock_t *lock = &wq->list_lock; |
| 261 | unsigned long flags; |
Omar Sandoval | c495dcd | 2019-09-16 11:30:53 -0700 | [diff] [blame^] | 262 | void *wtag; |
| 263 | bool free_self = false; |
Qu Wenruo | 08a9ff3 | 2014-02-28 10:46:03 +0800 | [diff] [blame] | 264 | |
| 265 | while (1) { |
| 266 | spin_lock_irqsave(lock, flags); |
| 267 | if (list_empty(list)) |
| 268 | break; |
Qu Wenruo | d458b05 | 2014-02-28 10:46:19 +0800 | [diff] [blame] | 269 | work = list_entry(list->next, struct btrfs_work, |
Qu Wenruo | 08a9ff3 | 2014-02-28 10:46:03 +0800 | [diff] [blame] | 270 | ordered_list); |
| 271 | if (!test_bit(WORK_DONE_BIT, &work->flags)) |
| 272 | break; |
| 273 | |
| 274 | /* |
| 275 | * we are going to call the ordered done function, but |
| 276 | * we leave the work item on the list as a barrier so |
| 277 | * that later work items that are done don't have their |
| 278 | * functions called before this one returns |
| 279 | */ |
| 280 | if (test_and_set_bit(WORK_ORDER_DONE_BIT, &work->flags)) |
| 281 | break; |
Qu Wenruo | 52483bc | 2014-03-06 04:19:50 +0000 | [diff] [blame] | 282 | trace_btrfs_ordered_sched(work); |
Qu Wenruo | 08a9ff3 | 2014-02-28 10:46:03 +0800 | [diff] [blame] | 283 | spin_unlock_irqrestore(lock, flags); |
| 284 | work->ordered_func(work); |
| 285 | |
| 286 | /* now take the lock again and drop our item from the list */ |
| 287 | spin_lock_irqsave(lock, flags); |
| 288 | list_del(&work->ordered_list); |
| 289 | spin_unlock_irqrestore(lock, flags); |
| 290 | |
Omar Sandoval | c495dcd | 2019-09-16 11:30:53 -0700 | [diff] [blame^] | 291 | if (work == self) { |
| 292 | /* |
| 293 | * This is the work item that the worker is currently |
| 294 | * executing. |
| 295 | * |
| 296 | * The kernel workqueue code guarantees non-reentrancy |
| 297 | * of work items. I.e., if a work item with the same |
| 298 | * address and work function is queued twice, the second |
| 299 | * execution is blocked until the first one finishes. A |
| 300 | * work item may be freed and recycled with the same |
| 301 | * work function; the workqueue code assumes that the |
| 302 | * original work item cannot depend on the recycled work |
| 303 | * item in that case (see find_worker_executing_work()). |
| 304 | * |
| 305 | * Note that the work of one Btrfs filesystem may depend |
| 306 | * on the work of another Btrfs filesystem via, e.g., a |
| 307 | * loop device. Therefore, we must not allow the current |
| 308 | * work item to be recycled until we are really done, |
| 309 | * otherwise we break the above assumption and can |
| 310 | * deadlock. |
| 311 | */ |
| 312 | free_self = true; |
| 313 | } else { |
| 314 | /* |
| 315 | * We don't want to call the ordered free functions with |
| 316 | * the lock held though. Save the work as tag for the |
| 317 | * trace event, because the callback could free the |
| 318 | * structure. |
| 319 | */ |
| 320 | wtag = work; |
| 321 | work->ordered_free(work); |
| 322 | trace_btrfs_all_work_done(wq->fs_info, wtag); |
| 323 | } |
Qu Wenruo | 08a9ff3 | 2014-02-28 10:46:03 +0800 | [diff] [blame] | 324 | } |
| 325 | spin_unlock_irqrestore(lock, flags); |
Omar Sandoval | c495dcd | 2019-09-16 11:30:53 -0700 | [diff] [blame^] | 326 | |
| 327 | if (free_self) { |
| 328 | wtag = self; |
| 329 | self->ordered_free(self); |
| 330 | trace_btrfs_all_work_done(wq->fs_info, wtag); |
| 331 | } |
Qu Wenruo | 08a9ff3 | 2014-02-28 10:46:03 +0800 | [diff] [blame] | 332 | } |
| 333 | |
Liu Bo | 9e0af23 | 2014-08-15 23:36:53 +0800 | [diff] [blame] | 334 | static void normal_work_helper(struct btrfs_work *work) |
Qu Wenruo | 08a9ff3 | 2014-02-28 10:46:03 +0800 | [diff] [blame] | 335 | { |
Qu Wenruo | d458b05 | 2014-02-28 10:46:19 +0800 | [diff] [blame] | 336 | struct __btrfs_workqueue *wq; |
David Sterba | ac0c7cf | 2017-01-06 14:12:51 +0100 | [diff] [blame] | 337 | void *wtag; |
Qu Wenruo | 08a9ff3 | 2014-02-28 10:46:03 +0800 | [diff] [blame] | 338 | int need_order = 0; |
| 339 | |
Qu Wenruo | 08a9ff3 | 2014-02-28 10:46:03 +0800 | [diff] [blame] | 340 | /* |
| 341 | * We should not touch things inside work in the following cases: |
| 342 | * 1) after work->func() if it has no ordered_free |
| 343 | * Since the struct is freed in work->func(). |
| 344 | * 2) after setting WORK_DONE_BIT |
| 345 | * The work may be freed in other threads almost instantly. |
| 346 | * So we save the needed things here. |
| 347 | */ |
| 348 | if (work->ordered_func) |
| 349 | need_order = 1; |
| 350 | wq = work->wq; |
David Sterba | ac0c7cf | 2017-01-06 14:12:51 +0100 | [diff] [blame] | 351 | /* Safe for tracepoints in case work gets freed by the callback */ |
| 352 | wtag = work; |
Qu Wenruo | 08a9ff3 | 2014-02-28 10:46:03 +0800 | [diff] [blame] | 353 | |
Qu Wenruo | 52483bc | 2014-03-06 04:19:50 +0000 | [diff] [blame] | 354 | trace_btrfs_work_sched(work); |
Qu Wenruo | 0bd9289 | 2014-02-28 10:46:05 +0800 | [diff] [blame] | 355 | thresh_exec_hook(wq); |
Qu Wenruo | 08a9ff3 | 2014-02-28 10:46:03 +0800 | [diff] [blame] | 356 | work->func(work); |
| 357 | if (need_order) { |
| 358 | set_bit(WORK_DONE_BIT, &work->flags); |
Omar Sandoval | c495dcd | 2019-09-16 11:30:53 -0700 | [diff] [blame^] | 359 | run_ordered_work(wq, work); |
Qu Wenruo | 08a9ff3 | 2014-02-28 10:46:03 +0800 | [diff] [blame] | 360 | } |
Qu Wenruo | 52483bc | 2014-03-06 04:19:50 +0000 | [diff] [blame] | 361 | if (!need_order) |
David Sterba | ac0c7cf | 2017-01-06 14:12:51 +0100 | [diff] [blame] | 362 | trace_btrfs_all_work_done(wq->fs_info, wtag); |
Qu Wenruo | 08a9ff3 | 2014-02-28 10:46:03 +0800 | [diff] [blame] | 363 | } |
| 364 | |
Liu Bo | 9e0af23 | 2014-08-15 23:36:53 +0800 | [diff] [blame] | 365 | void btrfs_init_work(struct btrfs_work *work, btrfs_work_func_t uniq_func, |
Qu Wenruo | 6db8914 | 2014-03-06 04:19:50 +0000 | [diff] [blame] | 366 | btrfs_func_t func, |
| 367 | btrfs_func_t ordered_func, |
| 368 | btrfs_func_t ordered_free) |
Qu Wenruo | 08a9ff3 | 2014-02-28 10:46:03 +0800 | [diff] [blame] | 369 | { |
| 370 | work->func = func; |
| 371 | work->ordered_func = ordered_func; |
| 372 | work->ordered_free = ordered_free; |
Liu Bo | 9e0af23 | 2014-08-15 23:36:53 +0800 | [diff] [blame] | 373 | INIT_WORK(&work->normal_work, uniq_func); |
Qu Wenruo | 08a9ff3 | 2014-02-28 10:46:03 +0800 | [diff] [blame] | 374 | INIT_LIST_HEAD(&work->ordered_list); |
| 375 | work->flags = 0; |
| 376 | } |
| 377 | |
Qu Wenruo | d458b05 | 2014-02-28 10:46:19 +0800 | [diff] [blame] | 378 | static inline void __btrfs_queue_work(struct __btrfs_workqueue *wq, |
| 379 | struct btrfs_work *work) |
Qu Wenruo | 08a9ff3 | 2014-02-28 10:46:03 +0800 | [diff] [blame] | 380 | { |
| 381 | unsigned long flags; |
| 382 | |
| 383 | work->wq = wq; |
Qu Wenruo | 0bd9289 | 2014-02-28 10:46:05 +0800 | [diff] [blame] | 384 | thresh_queue_hook(wq); |
Qu Wenruo | 08a9ff3 | 2014-02-28 10:46:03 +0800 | [diff] [blame] | 385 | if (work->ordered_func) { |
| 386 | spin_lock_irqsave(&wq->list_lock, flags); |
| 387 | list_add_tail(&work->ordered_list, &wq->ordered_list); |
| 388 | spin_unlock_irqrestore(&wq->list_lock, flags); |
| 389 | } |
Qu Wenruo | 52483bc | 2014-03-06 04:19:50 +0000 | [diff] [blame] | 390 | trace_btrfs_work_queued(work); |
Qu Wenruo | 0a95b85 | 2016-01-22 09:28:38 +0800 | [diff] [blame] | 391 | queue_work(wq->normal_wq, &work->normal_work); |
Qu Wenruo | 08a9ff3 | 2014-02-28 10:46:03 +0800 | [diff] [blame] | 392 | } |
| 393 | |
Qu Wenruo | d458b05 | 2014-02-28 10:46:19 +0800 | [diff] [blame] | 394 | void btrfs_queue_work(struct btrfs_workqueue *wq, |
| 395 | struct btrfs_work *work) |
Qu Wenruo | 1ca0897 | 2014-02-28 10:46:04 +0800 | [diff] [blame] | 396 | { |
Qu Wenruo | d458b05 | 2014-02-28 10:46:19 +0800 | [diff] [blame] | 397 | struct __btrfs_workqueue *dest_wq; |
Qu Wenruo | 1ca0897 | 2014-02-28 10:46:04 +0800 | [diff] [blame] | 398 | |
| 399 | if (test_bit(WORK_HIGH_PRIO_BIT, &work->flags) && wq->high) |
| 400 | dest_wq = wq->high; |
| 401 | else |
| 402 | dest_wq = wq->normal; |
| 403 | __btrfs_queue_work(dest_wq, work); |
| 404 | } |
| 405 | |
| 406 | static inline void |
Qu Wenruo | d458b05 | 2014-02-28 10:46:19 +0800 | [diff] [blame] | 407 | __btrfs_destroy_workqueue(struct __btrfs_workqueue *wq) |
Qu Wenruo | 08a9ff3 | 2014-02-28 10:46:03 +0800 | [diff] [blame] | 408 | { |
| 409 | destroy_workqueue(wq->normal_wq); |
Qu Wenruo | c3a4689 | 2014-03-12 08:05:33 +0000 | [diff] [blame] | 410 | trace_btrfs_workqueue_destroy(wq); |
Qu Wenruo | 08a9ff3 | 2014-02-28 10:46:03 +0800 | [diff] [blame] | 411 | kfree(wq); |
| 412 | } |
| 413 | |
Qu Wenruo | d458b05 | 2014-02-28 10:46:19 +0800 | [diff] [blame] | 414 | void btrfs_destroy_workqueue(struct btrfs_workqueue *wq) |
Qu Wenruo | 1ca0897 | 2014-02-28 10:46:04 +0800 | [diff] [blame] | 415 | { |
| 416 | if (!wq) |
| 417 | return; |
| 418 | if (wq->high) |
| 419 | __btrfs_destroy_workqueue(wq->high); |
| 420 | __btrfs_destroy_workqueue(wq->normal); |
Filipe Manana | ef66af1 | 2014-03-11 14:31:44 +0000 | [diff] [blame] | 421 | kfree(wq); |
Qu Wenruo | 1ca0897 | 2014-02-28 10:46:04 +0800 | [diff] [blame] | 422 | } |
| 423 | |
Qu Wenruo | c6dd6ea | 2015-08-20 09:30:39 +0800 | [diff] [blame] | 424 | void btrfs_workqueue_set_max(struct btrfs_workqueue *wq, int limit_active) |
Qu Wenruo | 08a9ff3 | 2014-02-28 10:46:03 +0800 | [diff] [blame] | 425 | { |
Sergei Trofimovich | 800ee22 | 2014-04-07 10:55:46 +0300 | [diff] [blame] | 426 | if (!wq) |
| 427 | return; |
Qu Wenruo | c6dd6ea | 2015-08-20 09:30:39 +0800 | [diff] [blame] | 428 | wq->normal->limit_active = limit_active; |
Qu Wenruo | 1ca0897 | 2014-02-28 10:46:04 +0800 | [diff] [blame] | 429 | if (wq->high) |
Qu Wenruo | c6dd6ea | 2015-08-20 09:30:39 +0800 | [diff] [blame] | 430 | wq->high->limit_active = limit_active; |
Qu Wenruo | 1ca0897 | 2014-02-28 10:46:04 +0800 | [diff] [blame] | 431 | } |
| 432 | |
Qu Wenruo | d458b05 | 2014-02-28 10:46:19 +0800 | [diff] [blame] | 433 | void btrfs_set_work_high_priority(struct btrfs_work *work) |
Qu Wenruo | 1ca0897 | 2014-02-28 10:46:04 +0800 | [diff] [blame] | 434 | { |
| 435 | set_bit(WORK_HIGH_PRIO_BIT, &work->flags); |
Qu Wenruo | 08a9ff3 | 2014-02-28 10:46:03 +0800 | [diff] [blame] | 436 | } |