Chris Mason | 8b71284 | 2008-06-11 16:50:36 -0400 | [diff] [blame] | 1 | /* |
| 2 | * Copyright (C) 2007 Oracle. All rights reserved. |
Qu Wenruo | 08a9ff3 | 2014-02-28 10:46:03 +0800 | [diff] [blame] | 3 | * Copyright (C) 2014 Fujitsu. All rights reserved. |
Chris Mason | 8b71284 | 2008-06-11 16:50:36 -0400 | [diff] [blame] | 4 | * |
| 5 | * This program is free software; you can redistribute it and/or |
| 6 | * modify it under the terms of the GNU General Public |
| 7 | * License v2 as published by the Free Software Foundation. |
| 8 | * |
| 9 | * This program is distributed in the hope that it will be useful, |
| 10 | * but WITHOUT ANY WARRANTY; without even the implied warranty of |
| 11 | * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU |
| 12 | * General Public License for more details. |
| 13 | * |
| 14 | * You should have received a copy of the GNU General Public |
| 15 | * License along with this program; if not, write to the |
| 16 | * Free Software Foundation, Inc., 59 Temple Place - Suite 330, |
| 17 | * Boston, MA 021110-1307, USA. |
| 18 | */ |
| 19 | |
| 20 | #include <linux/kthread.h> |
Tejun Heo | 5a0e3ad | 2010-03-24 17:04:11 +0900 | [diff] [blame] | 21 | #include <linux/slab.h> |
Chris Mason | 8b71284 | 2008-06-11 16:50:36 -0400 | [diff] [blame] | 22 | #include <linux/list.h> |
| 23 | #include <linux/spinlock.h> |
Chris Mason | b51912c | 2009-02-04 09:23:24 -0500 | [diff] [blame] | 24 | #include <linux/freezer.h> |
Qu Wenruo | 08a9ff3 | 2014-02-28 10:46:03 +0800 | [diff] [blame] | 25 | #include <linux/workqueue.h> |
Chris Mason | 8b71284 | 2008-06-11 16:50:36 -0400 | [diff] [blame] | 26 | #include "async-thread.h" |
Qu Wenruo | 52483bc | 2014-03-06 04:19:50 +0000 | [diff] [blame] | 27 | #include "ctree.h" |
Chris Mason | 8b71284 | 2008-06-11 16:50:36 -0400 | [diff] [blame] | 28 | |
Qu Wenruo | a046e9c | 2014-02-28 10:46:18 +0800 | [diff] [blame] | 29 | #define WORK_DONE_BIT 0 |
| 30 | #define WORK_ORDER_DONE_BIT 1 |
| 31 | #define WORK_HIGH_PRIO_BIT 2 |
Chris Mason | 4a69a41 | 2008-11-06 22:03:00 -0500 | [diff] [blame] | 32 | |
Qu Wenruo | 0bd9289 | 2014-02-28 10:46:05 +0800 | [diff] [blame] | 33 | #define NO_THRESHOLD (-1) |
| 34 | #define DFT_THRESHOLD (32) |
| 35 | |
Qu Wenruo | d458b05 | 2014-02-28 10:46:19 +0800 | [diff] [blame] | 36 | struct __btrfs_workqueue { |
Qu Wenruo | 08a9ff3 | 2014-02-28 10:46:03 +0800 | [diff] [blame] | 37 | struct workqueue_struct *normal_wq; |
| 38 | /* List head pointing to ordered work list */ |
| 39 | struct list_head ordered_list; |
| 40 | |
| 41 | /* Spinlock for ordered_list */ |
| 42 | spinlock_t list_lock; |
Qu Wenruo | 0bd9289 | 2014-02-28 10:46:05 +0800 | [diff] [blame] | 43 | |
| 44 | /* Thresholding related variants */ |
| 45 | atomic_t pending; |
| 46 | int max_active; |
| 47 | int current_max; |
| 48 | int thresh; |
| 49 | unsigned int count; |
| 50 | spinlock_t thres_lock; |
Qu Wenruo | 08a9ff3 | 2014-02-28 10:46:03 +0800 | [diff] [blame] | 51 | }; |
| 52 | |
Qu Wenruo | d458b05 | 2014-02-28 10:46:19 +0800 | [diff] [blame] | 53 | struct btrfs_workqueue { |
| 54 | struct __btrfs_workqueue *normal; |
| 55 | struct __btrfs_workqueue *high; |
Qu Wenruo | 1ca0897 | 2014-02-28 10:46:04 +0800 | [diff] [blame] | 56 | }; |
| 57 | |
Qu Wenruo | d458b05 | 2014-02-28 10:46:19 +0800 | [diff] [blame] | 58 | static inline struct __btrfs_workqueue |
Qu Wenruo | c3a4689 | 2014-03-12 08:05:33 +0000 | [diff] [blame^] | 59 | *__btrfs_alloc_workqueue(const char *name, int flags, int max_active, |
| 60 | int thresh) |
Qu Wenruo | 08a9ff3 | 2014-02-28 10:46:03 +0800 | [diff] [blame] | 61 | { |
Qu Wenruo | d458b05 | 2014-02-28 10:46:19 +0800 | [diff] [blame] | 62 | struct __btrfs_workqueue *ret = kzalloc(sizeof(*ret), GFP_NOFS); |
Qu Wenruo | 08a9ff3 | 2014-02-28 10:46:03 +0800 | [diff] [blame] | 63 | |
| 64 | if (unlikely(!ret)) |
| 65 | return NULL; |
| 66 | |
Qu Wenruo | 0bd9289 | 2014-02-28 10:46:05 +0800 | [diff] [blame] | 67 | ret->max_active = max_active; |
| 68 | atomic_set(&ret->pending, 0); |
| 69 | if (thresh == 0) |
| 70 | thresh = DFT_THRESHOLD; |
| 71 | /* For low threshold, disabling threshold is a better choice */ |
| 72 | if (thresh < DFT_THRESHOLD) { |
| 73 | ret->current_max = max_active; |
| 74 | ret->thresh = NO_THRESHOLD; |
| 75 | } else { |
| 76 | ret->current_max = 1; |
| 77 | ret->thresh = thresh; |
| 78 | } |
| 79 | |
Qu Wenruo | 1ca0897 | 2014-02-28 10:46:04 +0800 | [diff] [blame] | 80 | if (flags & WQ_HIGHPRI) |
| 81 | ret->normal_wq = alloc_workqueue("%s-%s-high", flags, |
Qu Wenruo | 0bd9289 | 2014-02-28 10:46:05 +0800 | [diff] [blame] | 82 | ret->max_active, |
| 83 | "btrfs", name); |
Qu Wenruo | 1ca0897 | 2014-02-28 10:46:04 +0800 | [diff] [blame] | 84 | else |
| 85 | ret->normal_wq = alloc_workqueue("%s-%s", flags, |
Qu Wenruo | 0bd9289 | 2014-02-28 10:46:05 +0800 | [diff] [blame] | 86 | ret->max_active, "btrfs", |
| 87 | name); |
Qu Wenruo | 08a9ff3 | 2014-02-28 10:46:03 +0800 | [diff] [blame] | 88 | if (unlikely(!ret->normal_wq)) { |
| 89 | kfree(ret); |
| 90 | return NULL; |
| 91 | } |
| 92 | |
| 93 | INIT_LIST_HEAD(&ret->ordered_list); |
| 94 | spin_lock_init(&ret->list_lock); |
Qu Wenruo | 0bd9289 | 2014-02-28 10:46:05 +0800 | [diff] [blame] | 95 | spin_lock_init(&ret->thres_lock); |
Qu Wenruo | c3a4689 | 2014-03-12 08:05:33 +0000 | [diff] [blame^] | 96 | trace_btrfs_workqueue_alloc(ret, name, flags & WQ_HIGHPRI); |
Qu Wenruo | 08a9ff3 | 2014-02-28 10:46:03 +0800 | [diff] [blame] | 97 | return ret; |
| 98 | } |
| 99 | |
Qu Wenruo | 1ca0897 | 2014-02-28 10:46:04 +0800 | [diff] [blame] | 100 | static inline void |
Qu Wenruo | d458b05 | 2014-02-28 10:46:19 +0800 | [diff] [blame] | 101 | __btrfs_destroy_workqueue(struct __btrfs_workqueue *wq); |
Qu Wenruo | 1ca0897 | 2014-02-28 10:46:04 +0800 | [diff] [blame] | 102 | |
Qu Wenruo | c3a4689 | 2014-03-12 08:05:33 +0000 | [diff] [blame^] | 103 | struct btrfs_workqueue *btrfs_alloc_workqueue(const char *name, |
Qu Wenruo | d458b05 | 2014-02-28 10:46:19 +0800 | [diff] [blame] | 104 | int flags, |
| 105 | int max_active, |
| 106 | int thresh) |
Qu Wenruo | 1ca0897 | 2014-02-28 10:46:04 +0800 | [diff] [blame] | 107 | { |
Qu Wenruo | d458b05 | 2014-02-28 10:46:19 +0800 | [diff] [blame] | 108 | struct btrfs_workqueue *ret = kzalloc(sizeof(*ret), GFP_NOFS); |
Qu Wenruo | 1ca0897 | 2014-02-28 10:46:04 +0800 | [diff] [blame] | 109 | |
| 110 | if (unlikely(!ret)) |
| 111 | return NULL; |
| 112 | |
| 113 | ret->normal = __btrfs_alloc_workqueue(name, flags & ~WQ_HIGHPRI, |
Qu Wenruo | 0bd9289 | 2014-02-28 10:46:05 +0800 | [diff] [blame] | 114 | max_active, thresh); |
Qu Wenruo | 1ca0897 | 2014-02-28 10:46:04 +0800 | [diff] [blame] | 115 | if (unlikely(!ret->normal)) { |
| 116 | kfree(ret); |
| 117 | return NULL; |
| 118 | } |
| 119 | |
| 120 | if (flags & WQ_HIGHPRI) { |
Qu Wenruo | 0bd9289 | 2014-02-28 10:46:05 +0800 | [diff] [blame] | 121 | ret->high = __btrfs_alloc_workqueue(name, flags, max_active, |
| 122 | thresh); |
Qu Wenruo | 1ca0897 | 2014-02-28 10:46:04 +0800 | [diff] [blame] | 123 | if (unlikely(!ret->high)) { |
| 124 | __btrfs_destroy_workqueue(ret->normal); |
| 125 | kfree(ret); |
| 126 | return NULL; |
| 127 | } |
| 128 | } |
| 129 | return ret; |
| 130 | } |
| 131 | |
Qu Wenruo | 0bd9289 | 2014-02-28 10:46:05 +0800 | [diff] [blame] | 132 | /* |
| 133 | * Hook for threshold which will be called in btrfs_queue_work. |
| 134 | * This hook WILL be called in IRQ handler context, |
| 135 | * so workqueue_set_max_active MUST NOT be called in this hook |
| 136 | */ |
Qu Wenruo | d458b05 | 2014-02-28 10:46:19 +0800 | [diff] [blame] | 137 | static inline void thresh_queue_hook(struct __btrfs_workqueue *wq) |
Qu Wenruo | 0bd9289 | 2014-02-28 10:46:05 +0800 | [diff] [blame] | 138 | { |
| 139 | if (wq->thresh == NO_THRESHOLD) |
| 140 | return; |
| 141 | atomic_inc(&wq->pending); |
| 142 | } |
| 143 | |
| 144 | /* |
| 145 | * Hook for threshold which will be called before executing the work, |
| 146 | * This hook is called in kthread content. |
| 147 | * So workqueue_set_max_active is called here. |
| 148 | */ |
Qu Wenruo | d458b05 | 2014-02-28 10:46:19 +0800 | [diff] [blame] | 149 | static inline void thresh_exec_hook(struct __btrfs_workqueue *wq) |
Qu Wenruo | 0bd9289 | 2014-02-28 10:46:05 +0800 | [diff] [blame] | 150 | { |
| 151 | int new_max_active; |
| 152 | long pending; |
| 153 | int need_change = 0; |
| 154 | |
| 155 | if (wq->thresh == NO_THRESHOLD) |
| 156 | return; |
| 157 | |
| 158 | atomic_dec(&wq->pending); |
| 159 | spin_lock(&wq->thres_lock); |
| 160 | /* |
| 161 | * Use wq->count to limit the calling frequency of |
| 162 | * workqueue_set_max_active. |
| 163 | */ |
| 164 | wq->count++; |
| 165 | wq->count %= (wq->thresh / 4); |
| 166 | if (!wq->count) |
| 167 | goto out; |
| 168 | new_max_active = wq->current_max; |
| 169 | |
| 170 | /* |
| 171 | * pending may be changed later, but it's OK since we really |
| 172 | * don't need it so accurate to calculate new_max_active. |
| 173 | */ |
| 174 | pending = atomic_read(&wq->pending); |
| 175 | if (pending > wq->thresh) |
| 176 | new_max_active++; |
| 177 | if (pending < wq->thresh / 2) |
| 178 | new_max_active--; |
| 179 | new_max_active = clamp_val(new_max_active, 1, wq->max_active); |
| 180 | if (new_max_active != wq->current_max) { |
| 181 | need_change = 1; |
| 182 | wq->current_max = new_max_active; |
| 183 | } |
| 184 | out: |
| 185 | spin_unlock(&wq->thres_lock); |
| 186 | |
| 187 | if (need_change) { |
| 188 | workqueue_set_max_active(wq->normal_wq, wq->current_max); |
| 189 | } |
| 190 | } |
| 191 | |
Qu Wenruo | d458b05 | 2014-02-28 10:46:19 +0800 | [diff] [blame] | 192 | static void run_ordered_work(struct __btrfs_workqueue *wq) |
Qu Wenruo | 08a9ff3 | 2014-02-28 10:46:03 +0800 | [diff] [blame] | 193 | { |
| 194 | struct list_head *list = &wq->ordered_list; |
Qu Wenruo | d458b05 | 2014-02-28 10:46:19 +0800 | [diff] [blame] | 195 | struct btrfs_work *work; |
Qu Wenruo | 08a9ff3 | 2014-02-28 10:46:03 +0800 | [diff] [blame] | 196 | spinlock_t *lock = &wq->list_lock; |
| 197 | unsigned long flags; |
| 198 | |
| 199 | while (1) { |
| 200 | spin_lock_irqsave(lock, flags); |
| 201 | if (list_empty(list)) |
| 202 | break; |
Qu Wenruo | d458b05 | 2014-02-28 10:46:19 +0800 | [diff] [blame] | 203 | work = list_entry(list->next, struct btrfs_work, |
Qu Wenruo | 08a9ff3 | 2014-02-28 10:46:03 +0800 | [diff] [blame] | 204 | ordered_list); |
| 205 | if (!test_bit(WORK_DONE_BIT, &work->flags)) |
| 206 | break; |
| 207 | |
| 208 | /* |
| 209 | * we are going to call the ordered done function, but |
| 210 | * we leave the work item on the list as a barrier so |
| 211 | * that later work items that are done don't have their |
| 212 | * functions called before this one returns |
| 213 | */ |
| 214 | if (test_and_set_bit(WORK_ORDER_DONE_BIT, &work->flags)) |
| 215 | break; |
Qu Wenruo | 52483bc | 2014-03-06 04:19:50 +0000 | [diff] [blame] | 216 | trace_btrfs_ordered_sched(work); |
Qu Wenruo | 08a9ff3 | 2014-02-28 10:46:03 +0800 | [diff] [blame] | 217 | spin_unlock_irqrestore(lock, flags); |
| 218 | work->ordered_func(work); |
| 219 | |
| 220 | /* now take the lock again and drop our item from the list */ |
| 221 | spin_lock_irqsave(lock, flags); |
| 222 | list_del(&work->ordered_list); |
| 223 | spin_unlock_irqrestore(lock, flags); |
| 224 | |
| 225 | /* |
| 226 | * we don't want to call the ordered free functions |
| 227 | * with the lock held though |
| 228 | */ |
| 229 | work->ordered_free(work); |
Qu Wenruo | 52483bc | 2014-03-06 04:19:50 +0000 | [diff] [blame] | 230 | trace_btrfs_all_work_done(work); |
Qu Wenruo | 08a9ff3 | 2014-02-28 10:46:03 +0800 | [diff] [blame] | 231 | } |
| 232 | spin_unlock_irqrestore(lock, flags); |
| 233 | } |
| 234 | |
| 235 | static void normal_work_helper(struct work_struct *arg) |
| 236 | { |
Qu Wenruo | d458b05 | 2014-02-28 10:46:19 +0800 | [diff] [blame] | 237 | struct btrfs_work *work; |
| 238 | struct __btrfs_workqueue *wq; |
Qu Wenruo | 08a9ff3 | 2014-02-28 10:46:03 +0800 | [diff] [blame] | 239 | int need_order = 0; |
| 240 | |
Qu Wenruo | d458b05 | 2014-02-28 10:46:19 +0800 | [diff] [blame] | 241 | work = container_of(arg, struct btrfs_work, normal_work); |
Qu Wenruo | 08a9ff3 | 2014-02-28 10:46:03 +0800 | [diff] [blame] | 242 | /* |
| 243 | * We should not touch things inside work in the following cases: |
| 244 | * 1) after work->func() if it has no ordered_free |
| 245 | * Since the struct is freed in work->func(). |
| 246 | * 2) after setting WORK_DONE_BIT |
| 247 | * The work may be freed in other threads almost instantly. |
| 248 | * So we save the needed things here. |
| 249 | */ |
| 250 | if (work->ordered_func) |
| 251 | need_order = 1; |
| 252 | wq = work->wq; |
| 253 | |
Qu Wenruo | 52483bc | 2014-03-06 04:19:50 +0000 | [diff] [blame] | 254 | trace_btrfs_work_sched(work); |
Qu Wenruo | 0bd9289 | 2014-02-28 10:46:05 +0800 | [diff] [blame] | 255 | thresh_exec_hook(wq); |
Qu Wenruo | 08a9ff3 | 2014-02-28 10:46:03 +0800 | [diff] [blame] | 256 | work->func(work); |
| 257 | if (need_order) { |
| 258 | set_bit(WORK_DONE_BIT, &work->flags); |
| 259 | run_ordered_work(wq); |
| 260 | } |
Qu Wenruo | 52483bc | 2014-03-06 04:19:50 +0000 | [diff] [blame] | 261 | if (!need_order) |
| 262 | trace_btrfs_all_work_done(work); |
Qu Wenruo | 08a9ff3 | 2014-02-28 10:46:03 +0800 | [diff] [blame] | 263 | } |
| 264 | |
Qu Wenruo | d458b05 | 2014-02-28 10:46:19 +0800 | [diff] [blame] | 265 | void btrfs_init_work(struct btrfs_work *work, |
Qu Wenruo | 6db8914 | 2014-03-06 04:19:50 +0000 | [diff] [blame] | 266 | btrfs_func_t func, |
| 267 | btrfs_func_t ordered_func, |
| 268 | btrfs_func_t ordered_free) |
Qu Wenruo | 08a9ff3 | 2014-02-28 10:46:03 +0800 | [diff] [blame] | 269 | { |
| 270 | work->func = func; |
| 271 | work->ordered_func = ordered_func; |
| 272 | work->ordered_free = ordered_free; |
| 273 | INIT_WORK(&work->normal_work, normal_work_helper); |
| 274 | INIT_LIST_HEAD(&work->ordered_list); |
| 275 | work->flags = 0; |
| 276 | } |
| 277 | |
Qu Wenruo | d458b05 | 2014-02-28 10:46:19 +0800 | [diff] [blame] | 278 | static inline void __btrfs_queue_work(struct __btrfs_workqueue *wq, |
| 279 | struct btrfs_work *work) |
Qu Wenruo | 08a9ff3 | 2014-02-28 10:46:03 +0800 | [diff] [blame] | 280 | { |
| 281 | unsigned long flags; |
| 282 | |
| 283 | work->wq = wq; |
Qu Wenruo | 0bd9289 | 2014-02-28 10:46:05 +0800 | [diff] [blame] | 284 | thresh_queue_hook(wq); |
Qu Wenruo | 08a9ff3 | 2014-02-28 10:46:03 +0800 | [diff] [blame] | 285 | if (work->ordered_func) { |
| 286 | spin_lock_irqsave(&wq->list_lock, flags); |
| 287 | list_add_tail(&work->ordered_list, &wq->ordered_list); |
| 288 | spin_unlock_irqrestore(&wq->list_lock, flags); |
| 289 | } |
| 290 | queue_work(wq->normal_wq, &work->normal_work); |
Qu Wenruo | 52483bc | 2014-03-06 04:19:50 +0000 | [diff] [blame] | 291 | trace_btrfs_work_queued(work); |
Qu Wenruo | 08a9ff3 | 2014-02-28 10:46:03 +0800 | [diff] [blame] | 292 | } |
| 293 | |
Qu Wenruo | d458b05 | 2014-02-28 10:46:19 +0800 | [diff] [blame] | 294 | void btrfs_queue_work(struct btrfs_workqueue *wq, |
| 295 | struct btrfs_work *work) |
Qu Wenruo | 1ca0897 | 2014-02-28 10:46:04 +0800 | [diff] [blame] | 296 | { |
Qu Wenruo | d458b05 | 2014-02-28 10:46:19 +0800 | [diff] [blame] | 297 | struct __btrfs_workqueue *dest_wq; |
Qu Wenruo | 1ca0897 | 2014-02-28 10:46:04 +0800 | [diff] [blame] | 298 | |
| 299 | if (test_bit(WORK_HIGH_PRIO_BIT, &work->flags) && wq->high) |
| 300 | dest_wq = wq->high; |
| 301 | else |
| 302 | dest_wq = wq->normal; |
| 303 | __btrfs_queue_work(dest_wq, work); |
| 304 | } |
| 305 | |
| 306 | static inline void |
Qu Wenruo | d458b05 | 2014-02-28 10:46:19 +0800 | [diff] [blame] | 307 | __btrfs_destroy_workqueue(struct __btrfs_workqueue *wq) |
Qu Wenruo | 08a9ff3 | 2014-02-28 10:46:03 +0800 | [diff] [blame] | 308 | { |
| 309 | destroy_workqueue(wq->normal_wq); |
Qu Wenruo | c3a4689 | 2014-03-12 08:05:33 +0000 | [diff] [blame^] | 310 | trace_btrfs_workqueue_destroy(wq); |
Qu Wenruo | 08a9ff3 | 2014-02-28 10:46:03 +0800 | [diff] [blame] | 311 | kfree(wq); |
| 312 | } |
| 313 | |
Qu Wenruo | d458b05 | 2014-02-28 10:46:19 +0800 | [diff] [blame] | 314 | void btrfs_destroy_workqueue(struct btrfs_workqueue *wq) |
Qu Wenruo | 1ca0897 | 2014-02-28 10:46:04 +0800 | [diff] [blame] | 315 | { |
| 316 | if (!wq) |
| 317 | return; |
| 318 | if (wq->high) |
| 319 | __btrfs_destroy_workqueue(wq->high); |
| 320 | __btrfs_destroy_workqueue(wq->normal); |
Filipe Manana | ef66af1 | 2014-03-11 14:31:44 +0000 | [diff] [blame] | 321 | kfree(wq); |
Qu Wenruo | 1ca0897 | 2014-02-28 10:46:04 +0800 | [diff] [blame] | 322 | } |
| 323 | |
Qu Wenruo | d458b05 | 2014-02-28 10:46:19 +0800 | [diff] [blame] | 324 | void btrfs_workqueue_set_max(struct btrfs_workqueue *wq, int max) |
Qu Wenruo | 08a9ff3 | 2014-02-28 10:46:03 +0800 | [diff] [blame] | 325 | { |
Qu Wenruo | 0bd9289 | 2014-02-28 10:46:05 +0800 | [diff] [blame] | 326 | wq->normal->max_active = max; |
Qu Wenruo | 1ca0897 | 2014-02-28 10:46:04 +0800 | [diff] [blame] | 327 | if (wq->high) |
Qu Wenruo | 0bd9289 | 2014-02-28 10:46:05 +0800 | [diff] [blame] | 328 | wq->high->max_active = max; |
Qu Wenruo | 1ca0897 | 2014-02-28 10:46:04 +0800 | [diff] [blame] | 329 | } |
| 330 | |
Qu Wenruo | d458b05 | 2014-02-28 10:46:19 +0800 | [diff] [blame] | 331 | void btrfs_set_work_high_priority(struct btrfs_work *work) |
Qu Wenruo | 1ca0897 | 2014-02-28 10:46:04 +0800 | [diff] [blame] | 332 | { |
| 333 | set_bit(WORK_HIGH_PRIO_BIT, &work->flags); |
Qu Wenruo | 08a9ff3 | 2014-02-28 10:46:03 +0800 | [diff] [blame] | 334 | } |