blob: 90e72b9f4b94eed6d1b20ee611f1521a9a93db73 [file] [log] [blame]
Matthew Wilcoxf8d5d0c2017-11-07 16:30:10 -05001// SPDX-License-Identifier: GPL-2.0+
2/*
3 * XArray implementation
Matthew Wilcox (Oracle)c44aa5e2020-01-17 22:13:21 -05004 * Copyright (c) 2017-2018 Microsoft Corporation
5 * Copyright (c) 2018-2020 Oracle
Matthew Wilcoxf8d5d0c2017-11-07 16:30:10 -05006 * Author: Matthew Wilcox <willy@infradead.org>
7 */
8
Matthew Wilcox9b89a032017-11-10 09:34:31 -05009#include <linux/bitmap.h>
Matthew Wilcoxf8d5d0c2017-11-07 16:30:10 -050010#include <linux/export.h>
Matthew Wilcox58d6ea32017-11-10 15:15:08 -050011#include <linux/list.h>
12#include <linux/slab.h>
Matthew Wilcoxf8d5d0c2017-11-07 16:30:10 -050013#include <linux/xarray.h>
14
15/*
16 * Coding conventions in this file:
17 *
18 * @xa is used to refer to the entire xarray.
19 * @xas is the 'xarray operation state'. It may be either a pointer to
20 * an xa_state, or an xa_state stored on the stack. This is an unfortunate
21 * ambiguity.
22 * @index is the index of the entry being operated on
23 * @mark is an xa_mark_t; a small number indicating one of the mark bits.
24 * @node refers to an xa_node; usually the primary one being operated on by
25 * this function.
26 * @offset is the index into the slots array inside an xa_node.
27 * @parent refers to the @xa_node closer to the head than @node.
28 * @entry refers to something stored in a slot in the xarray
29 */
30
Matthew Wilcox58d6ea32017-11-10 15:15:08 -050031static inline unsigned int xa_lock_type(const struct xarray *xa)
32{
33 return (__force unsigned int)xa->xa_flags & 3;
34}
35
36static inline void xas_lock_type(struct xa_state *xas, unsigned int lock_type)
37{
38 if (lock_type == XA_LOCK_IRQ)
39 xas_lock_irq(xas);
40 else if (lock_type == XA_LOCK_BH)
41 xas_lock_bh(xas);
42 else
43 xas_lock(xas);
44}
45
46static inline void xas_unlock_type(struct xa_state *xas, unsigned int lock_type)
47{
48 if (lock_type == XA_LOCK_IRQ)
49 xas_unlock_irq(xas);
50 else if (lock_type == XA_LOCK_BH)
51 xas_unlock_bh(xas);
52 else
53 xas_unlock(xas);
54}
55
Matthew Wilcox371c7522018-07-04 10:50:12 -040056static inline bool xa_track_free(const struct xarray *xa)
57{
58 return xa->xa_flags & XA_FLAGS_TRACK_FREE;
59}
60
Matthew Wilcox3ccaf572018-10-26 14:43:22 -040061static inline bool xa_zero_busy(const struct xarray *xa)
62{
63 return xa->xa_flags & XA_FLAGS_ZERO_BUSY;
64}
65
Matthew Wilcox9b89a032017-11-10 09:34:31 -050066static inline void xa_mark_set(struct xarray *xa, xa_mark_t mark)
67{
68 if (!(xa->xa_flags & XA_FLAGS_MARK(mark)))
69 xa->xa_flags |= XA_FLAGS_MARK(mark);
70}
71
72static inline void xa_mark_clear(struct xarray *xa, xa_mark_t mark)
73{
74 if (xa->xa_flags & XA_FLAGS_MARK(mark))
75 xa->xa_flags &= ~(XA_FLAGS_MARK(mark));
76}
77
78static inline unsigned long *node_marks(struct xa_node *node, xa_mark_t mark)
79{
80 return node->marks[(__force unsigned)mark];
81}
82
83static inline bool node_get_mark(struct xa_node *node,
84 unsigned int offset, xa_mark_t mark)
85{
86 return test_bit(offset, node_marks(node, mark));
87}
88
89/* returns true if the bit was set */
90static inline bool node_set_mark(struct xa_node *node, unsigned int offset,
91 xa_mark_t mark)
92{
93 return __test_and_set_bit(offset, node_marks(node, mark));
94}
95
96/* returns true if the bit was set */
97static inline bool node_clear_mark(struct xa_node *node, unsigned int offset,
98 xa_mark_t mark)
99{
100 return __test_and_clear_bit(offset, node_marks(node, mark));
101}
102
103static inline bool node_any_mark(struct xa_node *node, xa_mark_t mark)
104{
105 return !bitmap_empty(node_marks(node, mark), XA_CHUNK_SIZE);
106}
107
Matthew Wilcox371c7522018-07-04 10:50:12 -0400108static inline void node_mark_all(struct xa_node *node, xa_mark_t mark)
109{
110 bitmap_fill(node_marks(node, mark), XA_CHUNK_SIZE);
111}
112
Matthew Wilcox58d6ea32017-11-10 15:15:08 -0500113#define mark_inc(mark) do { \
114 mark = (__force xa_mark_t)((__force unsigned)(mark) + 1); \
115} while (0)
116
117/*
118 * xas_squash_marks() - Merge all marks to the first entry
119 * @xas: Array operation state.
120 *
121 * Set a mark on the first entry if any entry has it set. Clear marks on
122 * all sibling entries.
123 */
124static void xas_squash_marks(const struct xa_state *xas)
125{
126 unsigned int mark = 0;
127 unsigned int limit = xas->xa_offset + xas->xa_sibs + 1;
128
129 if (!xas->xa_sibs)
130 return;
131
132 do {
133 unsigned long *marks = xas->xa_node->marks[mark];
134 if (find_next_bit(marks, limit, xas->xa_offset + 1) == limit)
135 continue;
136 __set_bit(xas->xa_offset, marks);
137 bitmap_clear(marks, xas->xa_offset + 1, xas->xa_sibs);
138 } while (mark++ != (__force unsigned)XA_MARK_MAX);
139}
140
Matthew Wilcoxad3d6c72017-11-07 14:57:46 -0500141/* extracts the offset within this node from the index */
142static unsigned int get_offset(unsigned long index, struct xa_node *node)
143{
144 return (index >> node->shift) & XA_CHUNK_MASK;
145}
146
Matthew Wilcoxb803b422017-11-14 08:30:11 -0500147static void xas_set_offset(struct xa_state *xas)
148{
149 xas->xa_offset = get_offset(xas->xa_index, xas->xa_node);
150}
151
Matthew Wilcoxad3d6c72017-11-07 14:57:46 -0500152/* move the index either forwards (find) or backwards (sibling slot) */
153static void xas_move_index(struct xa_state *xas, unsigned long offset)
154{
155 unsigned int shift = xas->xa_node->shift;
156 xas->xa_index &= ~XA_CHUNK_MASK << shift;
157 xas->xa_index += offset << shift;
158}
159
Matthew Wilcoxb803b422017-11-14 08:30:11 -0500160static void xas_advance(struct xa_state *xas)
161{
162 xas->xa_offset++;
163 xas_move_index(xas, xas->xa_offset);
164}
165
Matthew Wilcoxad3d6c72017-11-07 14:57:46 -0500166static void *set_bounds(struct xa_state *xas)
167{
168 xas->xa_node = XAS_BOUNDS;
169 return NULL;
170}
171
172/*
173 * Starts a walk. If the @xas is already valid, we assume that it's on
174 * the right path and just return where we've got to. If we're in an
175 * error state, return NULL. If the index is outside the current scope
176 * of the xarray, return NULL without changing @xas->xa_node. Otherwise
177 * set @xas->xa_node to NULL and return the current head of the array.
178 */
179static void *xas_start(struct xa_state *xas)
180{
181 void *entry;
182
183 if (xas_valid(xas))
184 return xas_reload(xas);
185 if (xas_error(xas))
186 return NULL;
187
188 entry = xa_head(xas->xa);
189 if (!xa_is_node(entry)) {
190 if (xas->xa_index)
191 return set_bounds(xas);
192 } else {
193 if ((xas->xa_index >> xa_to_node(entry)->shift) > XA_CHUNK_MASK)
194 return set_bounds(xas);
195 }
196
197 xas->xa_node = NULL;
198 return entry;
199}
200
201static void *xas_descend(struct xa_state *xas, struct xa_node *node)
202{
203 unsigned int offset = get_offset(xas->xa_index, node);
204 void *entry = xa_entry(xas->xa, node, offset);
205
206 xas->xa_node = node;
207 if (xa_is_sibling(entry)) {
208 offset = xa_to_sibling(entry);
209 entry = xa_entry(xas->xa, node, offset);
210 }
211
212 xas->xa_offset = offset;
213 return entry;
214}
215
216/**
217 * xas_load() - Load an entry from the XArray (advanced).
218 * @xas: XArray operation state.
219 *
220 * Usually walks the @xas to the appropriate state to load the entry
221 * stored at xa_index. However, it will do nothing and return %NULL if
222 * @xas is in an error state. xas_load() will never expand the tree.
223 *
224 * If the xa_state is set up to operate on a multi-index entry, xas_load()
225 * may return %NULL or an internal entry, even if there are entries
226 * present within the range specified by @xas.
227 *
228 * Context: Any context. The caller should hold the xa_lock or the RCU lock.
229 * Return: Usually an entry in the XArray, but see description for exceptions.
230 */
231void *xas_load(struct xa_state *xas)
232{
233 void *entry = xas_start(xas);
234
235 while (xa_is_node(entry)) {
236 struct xa_node *node = xa_to_node(entry);
237
238 if (xas->xa_shift > node->shift)
239 break;
240 entry = xas_descend(xas, node);
Matthew Wilcox76b4e522018-12-28 23:20:44 -0500241 if (node->shift == 0)
242 break;
Matthew Wilcoxad3d6c72017-11-07 14:57:46 -0500243 }
244 return entry;
245}
246EXPORT_SYMBOL_GPL(xas_load);
247
Matthew Wilcox58d6ea32017-11-10 15:15:08 -0500248/* Move the radix tree node cache here */
249extern struct kmem_cache *radix_tree_node_cachep;
250extern void radix_tree_node_rcu_free(struct rcu_head *head);
251
252#define XA_RCU_FREE ((struct xarray *)1)
253
254static void xa_node_free(struct xa_node *node)
255{
256 XA_NODE_BUG_ON(node, !list_empty(&node->private_list));
257 node->array = XA_RCU_FREE;
258 call_rcu(&node->rcu_head, radix_tree_node_rcu_free);
259}
260
261/*
262 * xas_destroy() - Free any resources allocated during the XArray operation.
263 * @xas: XArray operation state.
264 *
265 * This function is now internal-only.
266 */
267static void xas_destroy(struct xa_state *xas)
268{
Matthew Wilcox (Oracle)8fc75642020-10-15 20:05:16 -0700269 struct xa_node *next, *node = xas->xa_alloc;
Matthew Wilcox58d6ea32017-11-10 15:15:08 -0500270
Matthew Wilcox (Oracle)8fc75642020-10-15 20:05:16 -0700271 while (node) {
272 XA_NODE_BUG_ON(node, !list_empty(&node->private_list));
273 next = rcu_dereference_raw(node->parent);
274 radix_tree_node_rcu_free(&node->rcu_head);
275 xas->xa_alloc = node = next;
276 }
Matthew Wilcox58d6ea32017-11-10 15:15:08 -0500277}
278
279/**
280 * xas_nomem() - Allocate memory if needed.
281 * @xas: XArray operation state.
282 * @gfp: Memory allocation flags.
283 *
284 * If we need to add new nodes to the XArray, we try to allocate memory
285 * with GFP_NOWAIT while holding the lock, which will usually succeed.
286 * If it fails, @xas is flagged as needing memory to continue. The caller
287 * should drop the lock and call xas_nomem(). If xas_nomem() succeeds,
288 * the caller should retry the operation.
289 *
290 * Forward progress is guaranteed as one node is allocated here and
291 * stored in the xa_state where it will be found by xas_alloc(). More
292 * nodes will likely be found in the slab allocator, but we do not tie
293 * them up here.
294 *
295 * Return: true if memory was needed, and was successfully allocated.
296 */
297bool xas_nomem(struct xa_state *xas, gfp_t gfp)
298{
299 if (xas->xa_node != XA_ERROR(-ENOMEM)) {
300 xas_destroy(xas);
301 return false;
302 }
Johannes Weiner7b785642019-05-24 10:12:46 -0400303 if (xas->xa->xa_flags & XA_FLAGS_ACCOUNT)
304 gfp |= __GFP_ACCOUNT;
Matthew Wilcox58d6ea32017-11-10 15:15:08 -0500305 xas->xa_alloc = kmem_cache_alloc(radix_tree_node_cachep, gfp);
306 if (!xas->xa_alloc)
307 return false;
Matthew Wilcox (Oracle)8fc75642020-10-15 20:05:16 -0700308 xas->xa_alloc->parent = NULL;
Matthew Wilcox58d6ea32017-11-10 15:15:08 -0500309 XA_NODE_BUG_ON(xas->xa_alloc, !list_empty(&xas->xa_alloc->private_list));
310 xas->xa_node = XAS_RESTART;
311 return true;
312}
313EXPORT_SYMBOL_GPL(xas_nomem);
314
315/*
316 * __xas_nomem() - Drop locks and allocate memory if needed.
317 * @xas: XArray operation state.
318 * @gfp: Memory allocation flags.
319 *
320 * Internal variant of xas_nomem().
321 *
322 * Return: true if memory was needed, and was successfully allocated.
323 */
324static bool __xas_nomem(struct xa_state *xas, gfp_t gfp)
325 __must_hold(xas->xa->xa_lock)
326{
327 unsigned int lock_type = xa_lock_type(xas->xa);
328
329 if (xas->xa_node != XA_ERROR(-ENOMEM)) {
330 xas_destroy(xas);
331 return false;
332 }
Johannes Weiner7b785642019-05-24 10:12:46 -0400333 if (xas->xa->xa_flags & XA_FLAGS_ACCOUNT)
334 gfp |= __GFP_ACCOUNT;
Matthew Wilcox58d6ea32017-11-10 15:15:08 -0500335 if (gfpflags_allow_blocking(gfp)) {
336 xas_unlock_type(xas, lock_type);
337 xas->xa_alloc = kmem_cache_alloc(radix_tree_node_cachep, gfp);
338 xas_lock_type(xas, lock_type);
339 } else {
340 xas->xa_alloc = kmem_cache_alloc(radix_tree_node_cachep, gfp);
341 }
342 if (!xas->xa_alloc)
343 return false;
Matthew Wilcox (Oracle)8fc75642020-10-15 20:05:16 -0700344 xas->xa_alloc->parent = NULL;
Matthew Wilcox58d6ea32017-11-10 15:15:08 -0500345 XA_NODE_BUG_ON(xas->xa_alloc, !list_empty(&xas->xa_alloc->private_list));
346 xas->xa_node = XAS_RESTART;
347 return true;
348}
349
350static void xas_update(struct xa_state *xas, struct xa_node *node)
351{
352 if (xas->xa_update)
353 xas->xa_update(node);
354 else
355 XA_NODE_BUG_ON(node, !list_empty(&node->private_list));
356}
357
358static void *xas_alloc(struct xa_state *xas, unsigned int shift)
359{
360 struct xa_node *parent = xas->xa_node;
361 struct xa_node *node = xas->xa_alloc;
362
363 if (xas_invalid(xas))
364 return NULL;
365
366 if (node) {
367 xas->xa_alloc = NULL;
368 } else {
Johannes Weiner7b785642019-05-24 10:12:46 -0400369 gfp_t gfp = GFP_NOWAIT | __GFP_NOWARN;
370
371 if (xas->xa->xa_flags & XA_FLAGS_ACCOUNT)
372 gfp |= __GFP_ACCOUNT;
373
374 node = kmem_cache_alloc(radix_tree_node_cachep, gfp);
Matthew Wilcox58d6ea32017-11-10 15:15:08 -0500375 if (!node) {
376 xas_set_err(xas, -ENOMEM);
377 return NULL;
378 }
379 }
380
381 if (parent) {
382 node->offset = xas->xa_offset;
383 parent->count++;
384 XA_NODE_BUG_ON(node, parent->count > XA_CHUNK_SIZE);
385 xas_update(xas, parent);
386 }
387 XA_NODE_BUG_ON(node, shift > BITS_PER_LONG);
388 XA_NODE_BUG_ON(node, !list_empty(&node->private_list));
389 node->shift = shift;
390 node->count = 0;
391 node->nr_values = 0;
392 RCU_INIT_POINTER(node->parent, xas->xa_node);
393 node->array = xas->xa;
394
395 return node;
396}
397
Matthew Wilcox0e9446c2018-08-15 14:13:29 -0400398#ifdef CONFIG_XARRAY_MULTI
399/* Returns the number of indices covered by a given xa_state */
400static unsigned long xas_size(const struct xa_state *xas)
401{
402 return (xas->xa_sibs + 1UL) << xas->xa_shift;
403}
404#endif
405
Matthew Wilcox58d6ea32017-11-10 15:15:08 -0500406/*
407 * Use this to calculate the maximum index that will need to be created
408 * in order to add the entry described by @xas. Because we cannot store a
Matthew Wilcox (Oracle)8fc75642020-10-15 20:05:16 -0700409 * multi-index entry at index 0, the calculation is a little more complex
Matthew Wilcox58d6ea32017-11-10 15:15:08 -0500410 * than you might expect.
411 */
412static unsigned long xas_max(struct xa_state *xas)
413{
414 unsigned long max = xas->xa_index;
415
416#ifdef CONFIG_XARRAY_MULTI
417 if (xas->xa_shift || xas->xa_sibs) {
Matthew Wilcox0e9446c2018-08-15 14:13:29 -0400418 unsigned long mask = xas_size(xas) - 1;
Matthew Wilcox58d6ea32017-11-10 15:15:08 -0500419 max |= mask;
420 if (mask == max)
421 max++;
422 }
423#endif
424
425 return max;
426}
427
428/* The maximum index that can be contained in the array without expanding it */
429static unsigned long max_index(void *entry)
430{
431 if (!xa_is_node(entry))
432 return 0;
433 return (XA_CHUNK_SIZE << xa_to_node(entry)->shift) - 1;
434}
435
436static void xas_shrink(struct xa_state *xas)
437{
438 struct xarray *xa = xas->xa;
439 struct xa_node *node = xas->xa_node;
440
441 for (;;) {
442 void *entry;
443
444 XA_NODE_BUG_ON(node, node->count > XA_CHUNK_SIZE);
445 if (node->count != 1)
446 break;
447 entry = xa_entry_locked(xa, node, 0);
448 if (!entry)
449 break;
450 if (!xa_is_node(entry) && node->shift)
451 break;
Matthew Wilcox3ccaf572018-10-26 14:43:22 -0400452 if (xa_is_zero(entry) && xa_zero_busy(xa))
453 entry = NULL;
Matthew Wilcox58d6ea32017-11-10 15:15:08 -0500454 xas->xa_node = XAS_BOUNDS;
455
456 RCU_INIT_POINTER(xa->xa_head, entry);
Matthew Wilcox371c7522018-07-04 10:50:12 -0400457 if (xa_track_free(xa) && !node_get_mark(node, 0, XA_FREE_MARK))
458 xa_mark_clear(xa, XA_FREE_MARK);
Matthew Wilcox58d6ea32017-11-10 15:15:08 -0500459
460 node->count = 0;
461 node->nr_values = 0;
462 if (!xa_is_node(entry))
463 RCU_INIT_POINTER(node->slots[0], XA_RETRY_ENTRY);
464 xas_update(xas, node);
465 xa_node_free(node);
466 if (!xa_is_node(entry))
467 break;
468 node = xa_to_node(entry);
469 node->parent = NULL;
470 }
471}
472
473/*
474 * xas_delete_node() - Attempt to delete an xa_node
475 * @xas: Array operation state.
476 *
477 * Attempts to delete the @xas->xa_node. This will fail if xa->node has
478 * a non-zero reference count.
479 */
480static void xas_delete_node(struct xa_state *xas)
481{
482 struct xa_node *node = xas->xa_node;
483
484 for (;;) {
485 struct xa_node *parent;
486
487 XA_NODE_BUG_ON(node, node->count > XA_CHUNK_SIZE);
488 if (node->count)
489 break;
490
491 parent = xa_parent_locked(xas->xa, node);
492 xas->xa_node = parent;
493 xas->xa_offset = node->offset;
494 xa_node_free(node);
495
496 if (!parent) {
497 xas->xa->xa_head = NULL;
498 xas->xa_node = XAS_BOUNDS;
499 return;
500 }
501
502 parent->slots[xas->xa_offset] = NULL;
503 parent->count--;
504 XA_NODE_BUG_ON(parent, parent->count > XA_CHUNK_SIZE);
505 node = parent;
506 xas_update(xas, node);
507 }
508
509 if (!node->parent)
510 xas_shrink(xas);
511}
512
513/**
514 * xas_free_nodes() - Free this node and all nodes that it references
515 * @xas: Array operation state.
516 * @top: Node to free
517 *
518 * This node has been removed from the tree. We must now free it and all
519 * of its subnodes. There may be RCU walkers with references into the tree,
520 * so we must replace all entries with retry markers.
521 */
522static void xas_free_nodes(struct xa_state *xas, struct xa_node *top)
523{
524 unsigned int offset = 0;
525 struct xa_node *node = top;
526
527 for (;;) {
528 void *entry = xa_entry_locked(xas->xa, node, offset);
529
Matthew Wilcox76b4e522018-12-28 23:20:44 -0500530 if (node->shift && xa_is_node(entry)) {
Matthew Wilcox58d6ea32017-11-10 15:15:08 -0500531 node = xa_to_node(entry);
532 offset = 0;
533 continue;
534 }
535 if (entry)
536 RCU_INIT_POINTER(node->slots[offset], XA_RETRY_ENTRY);
537 offset++;
538 while (offset == XA_CHUNK_SIZE) {
539 struct xa_node *parent;
540
541 parent = xa_parent_locked(xas->xa, node);
542 offset = node->offset + 1;
543 node->count = 0;
544 node->nr_values = 0;
545 xas_update(xas, node);
546 xa_node_free(node);
547 if (node == top)
548 return;
549 node = parent;
550 }
551 }
552}
553
554/*
555 * xas_expand adds nodes to the head of the tree until it has reached
556 * sufficient height to be able to contain @xas->xa_index
557 */
558static int xas_expand(struct xa_state *xas, void *head)
559{
560 struct xarray *xa = xas->xa;
561 struct xa_node *node = NULL;
562 unsigned int shift = 0;
563 unsigned long max = xas_max(xas);
564
565 if (!head) {
566 if (max == 0)
567 return 0;
568 while ((max >> shift) >= XA_CHUNK_SIZE)
569 shift += XA_CHUNK_SHIFT;
570 return shift + XA_CHUNK_SHIFT;
571 } else if (xa_is_node(head)) {
572 node = xa_to_node(head);
573 shift = node->shift + XA_CHUNK_SHIFT;
574 }
575 xas->xa_node = NULL;
576
577 while (max > max_index(head)) {
578 xa_mark_t mark = 0;
579
580 XA_NODE_BUG_ON(node, shift > BITS_PER_LONG);
581 node = xas_alloc(xas, shift);
582 if (!node)
583 return -ENOMEM;
584
585 node->count = 1;
586 if (xa_is_value(head))
587 node->nr_values = 1;
588 RCU_INIT_POINTER(node->slots[0], head);
589
590 /* Propagate the aggregated mark info to the new child */
591 for (;;) {
Matthew Wilcox371c7522018-07-04 10:50:12 -0400592 if (xa_track_free(xa) && mark == XA_FREE_MARK) {
593 node_mark_all(node, XA_FREE_MARK);
594 if (!xa_marked(xa, XA_FREE_MARK)) {
595 node_clear_mark(node, 0, XA_FREE_MARK);
596 xa_mark_set(xa, XA_FREE_MARK);
597 }
598 } else if (xa_marked(xa, mark)) {
Matthew Wilcox58d6ea32017-11-10 15:15:08 -0500599 node_set_mark(node, 0, mark);
Matthew Wilcox371c7522018-07-04 10:50:12 -0400600 }
Matthew Wilcox58d6ea32017-11-10 15:15:08 -0500601 if (mark == XA_MARK_MAX)
602 break;
603 mark_inc(mark);
604 }
605
606 /*
607 * Now that the new node is fully initialised, we can add
608 * it to the tree
609 */
610 if (xa_is_node(head)) {
611 xa_to_node(head)->offset = 0;
612 rcu_assign_pointer(xa_to_node(head)->parent, node);
613 }
614 head = xa_mk_node(node);
615 rcu_assign_pointer(xa->xa_head, head);
616 xas_update(xas, node);
617
618 shift += XA_CHUNK_SHIFT;
619 }
620
621 xas->xa_node = node;
622 return shift;
623}
624
625/*
626 * xas_create() - Create a slot to store an entry in.
627 * @xas: XArray operation state.
Matthew Wilcox76b4e522018-12-28 23:20:44 -0500628 * @allow_root: %true if we can store the entry in the root directly
Matthew Wilcox58d6ea32017-11-10 15:15:08 -0500629 *
630 * Most users will not need to call this function directly, as it is called
631 * by xas_store(). It is useful for doing conditional store operations
632 * (see the xa_cmpxchg() implementation for an example).
633 *
634 * Return: If the slot already existed, returns the contents of this slot.
Matthew Wilcox804dfaf2018-11-05 16:37:15 -0500635 * If the slot was newly created, returns %NULL. If it failed to create the
636 * slot, returns %NULL and indicates the error in @xas.
Matthew Wilcox58d6ea32017-11-10 15:15:08 -0500637 */
Matthew Wilcox76b4e522018-12-28 23:20:44 -0500638static void *xas_create(struct xa_state *xas, bool allow_root)
Matthew Wilcox58d6ea32017-11-10 15:15:08 -0500639{
640 struct xarray *xa = xas->xa;
641 void *entry;
642 void __rcu **slot;
643 struct xa_node *node = xas->xa_node;
644 int shift;
645 unsigned int order = xas->xa_shift;
646
647 if (xas_top(node)) {
648 entry = xa_head_locked(xa);
649 xas->xa_node = NULL;
Matthew Wilcox3ccaf572018-10-26 14:43:22 -0400650 if (!entry && xa_zero_busy(xa))
651 entry = XA_ZERO_ENTRY;
Matthew Wilcox58d6ea32017-11-10 15:15:08 -0500652 shift = xas_expand(xas, entry);
653 if (shift < 0)
654 return NULL;
Matthew Wilcox76b4e522018-12-28 23:20:44 -0500655 if (!shift && !allow_root)
656 shift = XA_CHUNK_SHIFT;
Matthew Wilcox58d6ea32017-11-10 15:15:08 -0500657 entry = xa_head_locked(xa);
658 slot = &xa->xa_head;
659 } else if (xas_error(xas)) {
660 return NULL;
661 } else if (node) {
662 unsigned int offset = xas->xa_offset;
663
664 shift = node->shift;
665 entry = xa_entry_locked(xa, node, offset);
666 slot = &node->slots[offset];
667 } else {
668 shift = 0;
669 entry = xa_head_locked(xa);
670 slot = &xa->xa_head;
671 }
672
673 while (shift > order) {
674 shift -= XA_CHUNK_SHIFT;
675 if (!entry) {
676 node = xas_alloc(xas, shift);
677 if (!node)
678 break;
Matthew Wilcox371c7522018-07-04 10:50:12 -0400679 if (xa_track_free(xa))
680 node_mark_all(node, XA_FREE_MARK);
Matthew Wilcox58d6ea32017-11-10 15:15:08 -0500681 rcu_assign_pointer(*slot, xa_mk_node(node));
682 } else if (xa_is_node(entry)) {
683 node = xa_to_node(entry);
684 } else {
685 break;
686 }
687 entry = xas_descend(xas, node);
688 slot = &node->slots[xas->xa_offset];
689 }
690
691 return entry;
692}
693
Matthew Wilcox2264f512017-12-04 00:11:48 -0500694/**
695 * xas_create_range() - Ensure that stores to this range will succeed
696 * @xas: XArray operation state.
697 *
698 * Creates all of the slots in the range covered by @xas. Sets @xas to
699 * create single-index entries and positions it at the beginning of the
700 * range. This is for the benefit of users which have not yet been
701 * converted to use multi-index entries.
702 */
703void xas_create_range(struct xa_state *xas)
704{
705 unsigned long index = xas->xa_index;
706 unsigned char shift = xas->xa_shift;
707 unsigned char sibs = xas->xa_sibs;
708
Matthew Wilcox (Oracle)84c34df2020-10-13 08:46:29 -0400709 xas->xa_index |= ((sibs + 1UL) << shift) - 1;
Matthew Wilcox2264f512017-12-04 00:11:48 -0500710 if (xas_is_node(xas) && xas->xa_node->shift == xas->xa_shift)
711 xas->xa_offset |= sibs;
712 xas->xa_shift = 0;
713 xas->xa_sibs = 0;
714
715 for (;;) {
Matthew Wilcox76b4e522018-12-28 23:20:44 -0500716 xas_create(xas, true);
Matthew Wilcox2264f512017-12-04 00:11:48 -0500717 if (xas_error(xas))
718 goto restore;
719 if (xas->xa_index <= (index | XA_CHUNK_MASK))
720 goto success;
721 xas->xa_index -= XA_CHUNK_SIZE;
722
723 for (;;) {
724 struct xa_node *node = xas->xa_node;
Matthew Wilcox (Oracle)1ac49c82022-03-28 19:25:11 -0400725 if (node->shift >= shift)
726 break;
Matthew Wilcox2264f512017-12-04 00:11:48 -0500727 xas->xa_node = xa_parent_locked(xas->xa, node);
728 xas->xa_offset = node->offset - 1;
729 if (node->offset != 0)
730 break;
731 }
732 }
733
734restore:
735 xas->xa_shift = shift;
736 xas->xa_sibs = sibs;
737 xas->xa_index = index;
738 return;
739success:
740 xas->xa_index = index;
741 if (xas->xa_node)
742 xas_set_offset(xas);
743}
744EXPORT_SYMBOL_GPL(xas_create_range);
745
Matthew Wilcox58d6ea32017-11-10 15:15:08 -0500746static void update_node(struct xa_state *xas, struct xa_node *node,
747 int count, int values)
748{
749 if (!node || (!count && !values))
750 return;
751
752 node->count += count;
753 node->nr_values += values;
754 XA_NODE_BUG_ON(node, node->count > XA_CHUNK_SIZE);
755 XA_NODE_BUG_ON(node, node->nr_values > XA_CHUNK_SIZE);
756 xas_update(xas, node);
757 if (count < 0)
758 xas_delete_node(xas);
759}
760
761/**
762 * xas_store() - Store this entry in the XArray.
763 * @xas: XArray operation state.
764 * @entry: New entry.
765 *
766 * If @xas is operating on a multi-index entry, the entry returned by this
767 * function is essentially meaningless (it may be an internal entry or it
768 * may be %NULL, even if there are non-NULL entries at some of the indices
769 * covered by the range). This is not a problem for any current users,
770 * and can be changed if needed.
771 *
772 * Return: The old entry at this index.
773 */
774void *xas_store(struct xa_state *xas, void *entry)
775{
776 struct xa_node *node;
777 void __rcu **slot = &xas->xa->xa_head;
778 unsigned int offset, max;
779 int count = 0;
780 int values = 0;
781 void *first, *next;
782 bool value = xa_is_value(entry);
783
Matthew Wilcox4a5c8d82019-02-21 17:54:44 -0500784 if (entry) {
785 bool allow_root = !xa_is_node(entry) && !xa_is_zero(entry);
786 first = xas_create(xas, allow_root);
787 } else {
Matthew Wilcox58d6ea32017-11-10 15:15:08 -0500788 first = xas_load(xas);
Matthew Wilcox4a5c8d82019-02-21 17:54:44 -0500789 }
Matthew Wilcox58d6ea32017-11-10 15:15:08 -0500790
791 if (xas_invalid(xas))
792 return first;
793 node = xas->xa_node;
794 if (node && (xas->xa_shift < node->shift))
795 xas->xa_sibs = 0;
796 if ((first == entry) && !xas->xa_sibs)
797 return first;
798
799 next = first;
800 offset = xas->xa_offset;
801 max = xas->xa_offset + xas->xa_sibs;
802 if (node) {
803 slot = &node->slots[offset];
804 if (xas->xa_sibs)
805 xas_squash_marks(xas);
806 }
807 if (!entry)
808 xas_init_marks(xas);
809
810 for (;;) {
811 /*
812 * Must clear the marks before setting the entry to NULL,
813 * otherwise xas_for_each_marked may find a NULL entry and
814 * stop early. rcu_assign_pointer contains a release barrier
815 * so the mark clearing will appear to happen before the
816 * entry is set to NULL.
817 */
818 rcu_assign_pointer(*slot, entry);
Matthew Wilcox2fbe9672019-02-21 17:36:45 -0500819 if (xa_is_node(next) && (!node || node->shift))
Matthew Wilcox58d6ea32017-11-10 15:15:08 -0500820 xas_free_nodes(xas, xa_to_node(next));
821 if (!node)
822 break;
823 count += !next - !entry;
824 values += !xa_is_value(first) - !value;
825 if (entry) {
826 if (offset == max)
827 break;
828 if (!xa_is_sibling(entry))
829 entry = xa_mk_sibling(xas->xa_offset);
830 } else {
831 if (offset == XA_CHUNK_MASK)
832 break;
833 }
834 next = xa_entry_locked(xas->xa, node, ++offset);
835 if (!xa_is_sibling(next)) {
836 if (!entry && (offset > max))
837 break;
838 first = next;
839 }
840 slot++;
841 }
842
843 update_node(xas, node, count, values);
844 return first;
845}
846EXPORT_SYMBOL_GPL(xas_store);
847
Matthew Wilcoxf8d5d0c2017-11-07 16:30:10 -0500848/**
Matthew Wilcox9b89a032017-11-10 09:34:31 -0500849 * xas_get_mark() - Returns the state of this mark.
850 * @xas: XArray operation state.
851 * @mark: Mark number.
852 *
853 * Return: true if the mark is set, false if the mark is clear or @xas
854 * is in an error state.
855 */
856bool xas_get_mark(const struct xa_state *xas, xa_mark_t mark)
857{
858 if (xas_invalid(xas))
859 return false;
860 if (!xas->xa_node)
861 return xa_marked(xas->xa, mark);
862 return node_get_mark(xas->xa_node, xas->xa_offset, mark);
863}
864EXPORT_SYMBOL_GPL(xas_get_mark);
865
866/**
867 * xas_set_mark() - Sets the mark on this entry and its parents.
868 * @xas: XArray operation state.
869 * @mark: Mark number.
870 *
871 * Sets the specified mark on this entry, and walks up the tree setting it
872 * on all the ancestor entries. Does nothing if @xas has not been walked to
873 * an entry, or is in an error state.
874 */
875void xas_set_mark(const struct xa_state *xas, xa_mark_t mark)
876{
877 struct xa_node *node = xas->xa_node;
878 unsigned int offset = xas->xa_offset;
879
880 if (xas_invalid(xas))
881 return;
882
883 while (node) {
884 if (node_set_mark(node, offset, mark))
885 return;
886 offset = node->offset;
887 node = xa_parent_locked(xas->xa, node);
888 }
889
890 if (!xa_marked(xas->xa, mark))
891 xa_mark_set(xas->xa, mark);
892}
893EXPORT_SYMBOL_GPL(xas_set_mark);
894
895/**
896 * xas_clear_mark() - Clears the mark on this entry and its parents.
897 * @xas: XArray operation state.
898 * @mark: Mark number.
899 *
900 * Clears the specified mark on this entry, and walks back to the head
901 * attempting to clear it on all the ancestor entries. Does nothing if
902 * @xas has not been walked to an entry, or is in an error state.
903 */
904void xas_clear_mark(const struct xa_state *xas, xa_mark_t mark)
905{
906 struct xa_node *node = xas->xa_node;
907 unsigned int offset = xas->xa_offset;
908
909 if (xas_invalid(xas))
910 return;
911
912 while (node) {
913 if (!node_clear_mark(node, offset, mark))
914 return;
915 if (node_any_mark(node, mark))
916 return;
917
918 offset = node->offset;
919 node = xa_parent_locked(xas->xa, node);
920 }
921
922 if (xa_marked(xas->xa, mark))
923 xa_mark_clear(xas->xa, mark);
924}
925EXPORT_SYMBOL_GPL(xas_clear_mark);
926
927/**
Matthew Wilcox58d6ea32017-11-10 15:15:08 -0500928 * xas_init_marks() - Initialise all marks for the entry
929 * @xas: Array operations state.
930 *
931 * Initialise all marks for the entry specified by @xas. If we're tracking
932 * free entries with a mark, we need to set it on all entries. All other
933 * marks are cleared.
934 *
935 * This implementation is not as efficient as it could be; we may walk
936 * up the tree multiple times.
937 */
938void xas_init_marks(const struct xa_state *xas)
939{
940 xa_mark_t mark = 0;
941
942 for (;;) {
Matthew Wilcox371c7522018-07-04 10:50:12 -0400943 if (xa_track_free(xas->xa) && mark == XA_FREE_MARK)
944 xas_set_mark(xas, mark);
945 else
946 xas_clear_mark(xas, mark);
Matthew Wilcox58d6ea32017-11-10 15:15:08 -0500947 if (mark == XA_MARK_MAX)
948 break;
949 mark_inc(mark);
950 }
951}
952EXPORT_SYMBOL_GPL(xas_init_marks);
953
Matthew Wilcox (Oracle)8fc75642020-10-15 20:05:16 -0700954#ifdef CONFIG_XARRAY_MULTI
955static unsigned int node_get_marks(struct xa_node *node, unsigned int offset)
956{
957 unsigned int marks = 0;
958 xa_mark_t mark = XA_MARK_0;
959
960 for (;;) {
961 if (node_get_mark(node, offset, mark))
962 marks |= 1 << (__force unsigned int)mark;
963 if (mark == XA_MARK_MAX)
964 break;
965 mark_inc(mark);
966 }
967
968 return marks;
969}
970
971static void node_set_marks(struct xa_node *node, unsigned int offset,
972 struct xa_node *child, unsigned int marks)
973{
974 xa_mark_t mark = XA_MARK_0;
975
976 for (;;) {
977 if (marks & (1 << (__force unsigned int)mark)) {
978 node_set_mark(node, offset, mark);
979 if (child)
980 node_mark_all(child, mark);
981 }
982 if (mark == XA_MARK_MAX)
983 break;
984 mark_inc(mark);
985 }
986}
987
988/**
989 * xas_split_alloc() - Allocate memory for splitting an entry.
990 * @xas: XArray operation state.
991 * @entry: New entry which will be stored in the array.
992 * @order: New entry order.
993 * @gfp: Memory allocation flags.
994 *
995 * This function should be called before calling xas_split().
996 * If necessary, it will allocate new nodes (and fill them with @entry)
997 * to prepare for the upcoming split of an entry of @order size into
998 * entries of the order stored in the @xas.
999 *
1000 * Context: May sleep if @gfp flags permit.
1001 */
1002void xas_split_alloc(struct xa_state *xas, void *entry, unsigned int order,
1003 gfp_t gfp)
1004{
1005 unsigned int sibs = (1 << (order % XA_CHUNK_SHIFT)) - 1;
1006 unsigned int mask = xas->xa_sibs;
1007
1008 /* XXX: no support for splitting really large entries yet */
1009 if (WARN_ON(xas->xa_shift + 2 * XA_CHUNK_SHIFT < order))
1010 goto nomem;
1011 if (xas->xa_shift + XA_CHUNK_SHIFT > order)
1012 return;
1013
1014 do {
1015 unsigned int i;
Matthew Wilcox (Oracle)d99e22c2020-11-19 08:32:31 -05001016 void *sibling = NULL;
Matthew Wilcox (Oracle)8fc75642020-10-15 20:05:16 -07001017 struct xa_node *node;
1018
1019 node = kmem_cache_alloc(radix_tree_node_cachep, gfp);
1020 if (!node)
1021 goto nomem;
1022 node->array = xas->xa;
1023 for (i = 0; i < XA_CHUNK_SIZE; i++) {
1024 if ((i & mask) == 0) {
1025 RCU_INIT_POINTER(node->slots[i], entry);
Matthew Wilcox (Oracle)d99e22c2020-11-19 08:32:31 -05001026 sibling = xa_mk_sibling(i);
Matthew Wilcox (Oracle)8fc75642020-10-15 20:05:16 -07001027 } else {
1028 RCU_INIT_POINTER(node->slots[i], sibling);
1029 }
1030 }
1031 RCU_INIT_POINTER(node->parent, xas->xa_alloc);
1032 xas->xa_alloc = node;
1033 } while (sibs-- > 0);
1034
1035 return;
1036nomem:
1037 xas_destroy(xas);
1038 xas_set_err(xas, -ENOMEM);
1039}
1040EXPORT_SYMBOL_GPL(xas_split_alloc);
1041
1042/**
1043 * xas_split() - Split a multi-index entry into smaller entries.
1044 * @xas: XArray operation state.
1045 * @entry: New entry to store in the array.
1046 * @order: New entry order.
1047 *
1048 * The value in the entry is copied to all the replacement entries.
1049 *
1050 * Context: Any context. The caller should hold the xa_lock.
1051 */
1052void xas_split(struct xa_state *xas, void *entry, unsigned int order)
1053{
1054 unsigned int sibs = (1 << (order % XA_CHUNK_SHIFT)) - 1;
1055 unsigned int offset, marks;
1056 struct xa_node *node;
1057 void *curr = xas_load(xas);
1058 int values = 0;
1059
1060 node = xas->xa_node;
1061 if (xas_top(node))
1062 return;
1063
1064 marks = node_get_marks(node, xas->xa_offset);
1065
1066 offset = xas->xa_offset + sibs;
1067 do {
1068 if (xas->xa_shift < node->shift) {
1069 struct xa_node *child = xas->xa_alloc;
1070
1071 xas->xa_alloc = rcu_dereference_raw(child->parent);
1072 child->shift = node->shift - XA_CHUNK_SHIFT;
1073 child->offset = offset;
1074 child->count = XA_CHUNK_SIZE;
1075 child->nr_values = xa_is_value(entry) ?
1076 XA_CHUNK_SIZE : 0;
1077 RCU_INIT_POINTER(child->parent, node);
1078 node_set_marks(node, offset, child, marks);
1079 rcu_assign_pointer(node->slots[offset],
1080 xa_mk_node(child));
1081 if (xa_is_value(curr))
1082 values--;
1083 } else {
1084 unsigned int canon = offset - xas->xa_sibs;
1085
1086 node_set_marks(node, canon, NULL, marks);
1087 rcu_assign_pointer(node->slots[canon], entry);
1088 while (offset > canon)
1089 rcu_assign_pointer(node->slots[offset--],
1090 xa_mk_sibling(canon));
1091 values += (xa_is_value(entry) - xa_is_value(curr)) *
1092 (xas->xa_sibs + 1);
1093 }
1094 } while (offset-- > xas->xa_offset);
1095
1096 node->nr_values += values;
1097}
1098EXPORT_SYMBOL_GPL(xas_split);
1099#endif
1100
Matthew Wilcox58d6ea32017-11-10 15:15:08 -05001101/**
Matthew Wilcoxb803b422017-11-14 08:30:11 -05001102 * xas_pause() - Pause a walk to drop a lock.
1103 * @xas: XArray operation state.
1104 *
1105 * Some users need to pause a walk and drop the lock they're holding in
1106 * order to yield to a higher priority thread or carry out an operation
1107 * on an entry. Those users should call this function before they drop
1108 * the lock. It resets the @xas to be suitable for the next iteration
1109 * of the loop after the user has reacquired the lock. If most entries
1110 * found during a walk require you to call xas_pause(), the xa_for_each()
1111 * iterator may be more appropriate.
1112 *
1113 * Note that xas_pause() only works for forward iteration. If a user needs
1114 * to pause a reverse iteration, we will need a xas_pause_rev().
1115 */
1116void xas_pause(struct xa_state *xas)
1117{
1118 struct xa_node *node = xas->xa_node;
1119
1120 if (xas_invalid(xas))
1121 return;
1122
Matthew Wilcox (Oracle)82a22312019-11-07 22:49:11 -05001123 xas->xa_node = XAS_RESTART;
Matthew Wilcoxb803b422017-11-14 08:30:11 -05001124 if (node) {
Matthew Wilcox (Oracle)c36d4512020-01-31 06:17:09 -05001125 unsigned long offset = xas->xa_offset;
Matthew Wilcoxb803b422017-11-14 08:30:11 -05001126 while (++offset < XA_CHUNK_SIZE) {
1127 if (!xa_is_sibling(xa_entry(xas->xa, node, offset)))
1128 break;
1129 }
1130 xas->xa_index += (offset - xas->xa_offset) << node->shift;
Matthew Wilcox (Oracle)82a22312019-11-07 22:49:11 -05001131 if (xas->xa_index == 0)
1132 xas->xa_node = XAS_BOUNDS;
Matthew Wilcoxb803b422017-11-14 08:30:11 -05001133 } else {
1134 xas->xa_index++;
1135 }
Matthew Wilcoxb803b422017-11-14 08:30:11 -05001136}
1137EXPORT_SYMBOL_GPL(xas_pause);
1138
Matthew Wilcox64d3e9a2017-12-01 00:06:52 -05001139/*
1140 * __xas_prev() - Find the previous entry in the XArray.
1141 * @xas: XArray operation state.
1142 *
1143 * Helper function for xas_prev() which handles all the complex cases
1144 * out of line.
1145 */
1146void *__xas_prev(struct xa_state *xas)
1147{
1148 void *entry;
1149
1150 if (!xas_frozen(xas->xa_node))
1151 xas->xa_index--;
Matthew Wilcox (Oracle)91abab82019-07-01 17:03:29 -04001152 if (!xas->xa_node)
1153 return set_bounds(xas);
Matthew Wilcox64d3e9a2017-12-01 00:06:52 -05001154 if (xas_not_node(xas->xa_node))
1155 return xas_load(xas);
1156
1157 if (xas->xa_offset != get_offset(xas->xa_index, xas->xa_node))
1158 xas->xa_offset--;
1159
1160 while (xas->xa_offset == 255) {
1161 xas->xa_offset = xas->xa_node->offset - 1;
1162 xas->xa_node = xa_parent(xas->xa, xas->xa_node);
1163 if (!xas->xa_node)
1164 return set_bounds(xas);
1165 }
1166
1167 for (;;) {
1168 entry = xa_entry(xas->xa, xas->xa_node, xas->xa_offset);
1169 if (!xa_is_node(entry))
1170 return entry;
1171
1172 xas->xa_node = xa_to_node(entry);
1173 xas_set_offset(xas);
1174 }
1175}
1176EXPORT_SYMBOL_GPL(__xas_prev);
1177
1178/*
1179 * __xas_next() - Find the next entry in the XArray.
1180 * @xas: XArray operation state.
1181 *
1182 * Helper function for xas_next() which handles all the complex cases
1183 * out of line.
1184 */
1185void *__xas_next(struct xa_state *xas)
1186{
1187 void *entry;
1188
1189 if (!xas_frozen(xas->xa_node))
1190 xas->xa_index++;
Matthew Wilcox (Oracle)91abab82019-07-01 17:03:29 -04001191 if (!xas->xa_node)
1192 return set_bounds(xas);
Matthew Wilcox64d3e9a2017-12-01 00:06:52 -05001193 if (xas_not_node(xas->xa_node))
1194 return xas_load(xas);
1195
1196 if (xas->xa_offset != get_offset(xas->xa_index, xas->xa_node))
1197 xas->xa_offset++;
1198
1199 while (xas->xa_offset == XA_CHUNK_SIZE) {
1200 xas->xa_offset = xas->xa_node->offset + 1;
1201 xas->xa_node = xa_parent(xas->xa, xas->xa_node);
1202 if (!xas->xa_node)
1203 return set_bounds(xas);
1204 }
1205
1206 for (;;) {
1207 entry = xa_entry(xas->xa, xas->xa_node, xas->xa_offset);
1208 if (!xa_is_node(entry))
1209 return entry;
1210
1211 xas->xa_node = xa_to_node(entry);
1212 xas_set_offset(xas);
1213 }
1214}
1215EXPORT_SYMBOL_GPL(__xas_next);
1216
Matthew Wilcoxb803b422017-11-14 08:30:11 -05001217/**
1218 * xas_find() - Find the next present entry in the XArray.
1219 * @xas: XArray operation state.
1220 * @max: Highest index to return.
1221 *
1222 * If the @xas has not yet been walked to an entry, return the entry
1223 * which has an index >= xas.xa_index. If it has been walked, the entry
1224 * currently being pointed at has been processed, and so we move to the
1225 * next entry.
1226 *
1227 * If no entry is found and the array is smaller than @max, the iterator
1228 * is set to the smallest index not yet in the array. This allows @xas
1229 * to be immediately passed to xas_store().
1230 *
1231 * Return: The entry, if found, otherwise %NULL.
1232 */
1233void *xas_find(struct xa_state *xas, unsigned long max)
1234{
1235 void *entry;
1236
Matthew Wilcox (Oracle)82a22312019-11-07 22:49:11 -05001237 if (xas_error(xas) || xas->xa_node == XAS_BOUNDS)
Matthew Wilcoxb803b422017-11-14 08:30:11 -05001238 return NULL;
Matthew Wilcox (Oracle)c44aa5e2020-01-17 22:13:21 -05001239 if (xas->xa_index > max)
1240 return set_bounds(xas);
Matthew Wilcoxb803b422017-11-14 08:30:11 -05001241
1242 if (!xas->xa_node) {
1243 xas->xa_index = 1;
1244 return set_bounds(xas);
Matthew Wilcox (Oracle)82a22312019-11-07 22:49:11 -05001245 } else if (xas->xa_node == XAS_RESTART) {
Matthew Wilcoxb803b422017-11-14 08:30:11 -05001246 entry = xas_load(xas);
1247 if (entry || xas_not_node(xas->xa_node))
1248 return entry;
1249 } else if (!xas->xa_node->shift &&
1250 xas->xa_offset != (xas->xa_index & XA_CHUNK_MASK)) {
1251 xas->xa_offset = ((xas->xa_index - 1) & XA_CHUNK_MASK) + 1;
1252 }
1253
1254 xas_advance(xas);
1255
1256 while (xas->xa_node && (xas->xa_index <= max)) {
1257 if (unlikely(xas->xa_offset == XA_CHUNK_SIZE)) {
1258 xas->xa_offset = xas->xa_node->offset + 1;
1259 xas->xa_node = xa_parent(xas->xa, xas->xa_node);
1260 continue;
1261 }
1262
1263 entry = xa_entry(xas->xa, xas->xa_node, xas->xa_offset);
1264 if (xa_is_node(entry)) {
1265 xas->xa_node = xa_to_node(entry);
1266 xas->xa_offset = 0;
1267 continue;
1268 }
1269 if (entry && !xa_is_sibling(entry))
1270 return entry;
1271
1272 xas_advance(xas);
1273 }
1274
1275 if (!xas->xa_node)
1276 xas->xa_node = XAS_BOUNDS;
1277 return NULL;
1278}
1279EXPORT_SYMBOL_GPL(xas_find);
1280
1281/**
1282 * xas_find_marked() - Find the next marked entry in the XArray.
1283 * @xas: XArray operation state.
1284 * @max: Highest index to return.
1285 * @mark: Mark number to search for.
1286 *
1287 * If the @xas has not yet been walked to an entry, return the marked entry
1288 * which has an index >= xas.xa_index. If it has been walked, the entry
1289 * currently being pointed at has been processed, and so we return the
1290 * first marked entry with an index > xas.xa_index.
1291 *
1292 * If no marked entry is found and the array is smaller than @max, @xas is
1293 * set to the bounds state and xas->xa_index is set to the smallest index
1294 * not yet in the array. This allows @xas to be immediately passed to
1295 * xas_store().
1296 *
1297 * If no entry is found before @max is reached, @xas is set to the restart
1298 * state.
1299 *
1300 * Return: The entry, if found, otherwise %NULL.
1301 */
1302void *xas_find_marked(struct xa_state *xas, unsigned long max, xa_mark_t mark)
1303{
1304 bool advance = true;
1305 unsigned int offset;
1306 void *entry;
1307
1308 if (xas_error(xas))
1309 return NULL;
Matthew Wilcox (Oracle)c44aa5e2020-01-17 22:13:21 -05001310 if (xas->xa_index > max)
1311 goto max;
Matthew Wilcoxb803b422017-11-14 08:30:11 -05001312
1313 if (!xas->xa_node) {
1314 xas->xa_index = 1;
1315 goto out;
1316 } else if (xas_top(xas->xa_node)) {
1317 advance = false;
1318 entry = xa_head(xas->xa);
1319 xas->xa_node = NULL;
1320 if (xas->xa_index > max_index(entry))
Matthew Wilcox48483612018-12-13 13:57:42 -05001321 goto out;
Matthew Wilcoxb803b422017-11-14 08:30:11 -05001322 if (!xa_is_node(entry)) {
1323 if (xa_marked(xas->xa, mark))
1324 return entry;
1325 xas->xa_index = 1;
1326 goto out;
1327 }
1328 xas->xa_node = xa_to_node(entry);
1329 xas->xa_offset = xas->xa_index >> xas->xa_node->shift;
1330 }
1331
1332 while (xas->xa_index <= max) {
1333 if (unlikely(xas->xa_offset == XA_CHUNK_SIZE)) {
1334 xas->xa_offset = xas->xa_node->offset + 1;
1335 xas->xa_node = xa_parent(xas->xa, xas->xa_node);
1336 if (!xas->xa_node)
1337 break;
1338 advance = false;
1339 continue;
1340 }
1341
1342 if (!advance) {
1343 entry = xa_entry(xas->xa, xas->xa_node, xas->xa_offset);
1344 if (xa_is_sibling(entry)) {
1345 xas->xa_offset = xa_to_sibling(entry);
1346 xas_move_index(xas, xas->xa_offset);
1347 }
1348 }
1349
1350 offset = xas_find_chunk(xas, advance, mark);
1351 if (offset > xas->xa_offset) {
1352 advance = false;
1353 xas_move_index(xas, offset);
1354 /* Mind the wrap */
1355 if ((xas->xa_index - 1) >= max)
1356 goto max;
1357 xas->xa_offset = offset;
1358 if (offset == XA_CHUNK_SIZE)
1359 continue;
1360 }
1361
1362 entry = xa_entry(xas->xa, xas->xa_node, xas->xa_offset);
Matthew Wilcox (Oracle)7e934cf2020-03-12 17:29:11 -04001363 if (!entry && !(xa_track_free(xas->xa) && mark == XA_FREE_MARK))
1364 continue;
Matthew Wilcoxb803b422017-11-14 08:30:11 -05001365 if (!xa_is_node(entry))
1366 return entry;
1367 xas->xa_node = xa_to_node(entry);
1368 xas_set_offset(xas);
1369 }
1370
1371out:
Matthew Wilcox48483612018-12-13 13:57:42 -05001372 if (xas->xa_index > max)
Matthew Wilcoxb803b422017-11-14 08:30:11 -05001373 goto max;
Matthew Wilcox48483612018-12-13 13:57:42 -05001374 return set_bounds(xas);
Matthew Wilcoxb803b422017-11-14 08:30:11 -05001375max:
1376 xas->xa_node = XAS_RESTART;
1377 return NULL;
1378}
1379EXPORT_SYMBOL_GPL(xas_find_marked);
1380
1381/**
Matthew Wilcox4e99d4e2018-06-01 22:46:02 -04001382 * xas_find_conflict() - Find the next present entry in a range.
1383 * @xas: XArray operation state.
1384 *
1385 * The @xas describes both a range and a position within that range.
1386 *
1387 * Context: Any context. Expects xa_lock to be held.
1388 * Return: The next entry in the range covered by @xas or %NULL.
1389 */
1390void *xas_find_conflict(struct xa_state *xas)
1391{
1392 void *curr;
1393
1394 if (xas_error(xas))
1395 return NULL;
1396
1397 if (!xas->xa_node)
1398 return NULL;
1399
1400 if (xas_top(xas->xa_node)) {
1401 curr = xas_start(xas);
1402 if (!curr)
1403 return NULL;
1404 while (xa_is_node(curr)) {
1405 struct xa_node *node = xa_to_node(curr);
1406 curr = xas_descend(xas, node);
1407 }
1408 if (curr)
1409 return curr;
1410 }
1411
1412 if (xas->xa_node->shift > xas->xa_shift)
1413 return NULL;
1414
1415 for (;;) {
1416 if (xas->xa_node->shift == xas->xa_shift) {
1417 if ((xas->xa_offset & xas->xa_sibs) == xas->xa_sibs)
1418 break;
1419 } else if (xas->xa_offset == XA_CHUNK_MASK) {
1420 xas->xa_offset = xas->xa_node->offset;
1421 xas->xa_node = xa_parent_locked(xas->xa, xas->xa_node);
1422 if (!xas->xa_node)
1423 break;
1424 continue;
1425 }
1426 curr = xa_entry_locked(xas->xa, xas->xa_node, ++xas->xa_offset);
1427 if (xa_is_sibling(curr))
1428 continue;
1429 while (xa_is_node(curr)) {
1430 xas->xa_node = xa_to_node(curr);
1431 xas->xa_offset = 0;
1432 curr = xa_entry_locked(xas->xa, xas->xa_node, 0);
1433 }
1434 if (curr)
1435 return curr;
1436 }
1437 xas->xa_offset -= xas->xa_sibs;
1438 return NULL;
1439}
1440EXPORT_SYMBOL_GPL(xas_find_conflict);
1441
1442/**
Matthew Wilcoxad3d6c72017-11-07 14:57:46 -05001443 * xa_load() - Load an entry from an XArray.
1444 * @xa: XArray.
1445 * @index: index into array.
1446 *
1447 * Context: Any context. Takes and releases the RCU lock.
1448 * Return: The entry at @index in @xa.
1449 */
1450void *xa_load(struct xarray *xa, unsigned long index)
1451{
1452 XA_STATE(xas, xa, index);
1453 void *entry;
1454
1455 rcu_read_lock();
1456 do {
1457 entry = xas_load(&xas);
Matthew Wilcox9f14d4f2018-10-01 14:54:59 -04001458 if (xa_is_zero(entry))
1459 entry = NULL;
Matthew Wilcoxad3d6c72017-11-07 14:57:46 -05001460 } while (xas_retry(&xas, entry));
1461 rcu_read_unlock();
1462
1463 return entry;
1464}
1465EXPORT_SYMBOL(xa_load);
1466
Matthew Wilcox58d6ea32017-11-10 15:15:08 -05001467static void *xas_result(struct xa_state *xas, void *curr)
1468{
Matthew Wilcox9f14d4f2018-10-01 14:54:59 -04001469 if (xa_is_zero(curr))
1470 return NULL;
Matthew Wilcox58d6ea32017-11-10 15:15:08 -05001471 if (xas_error(xas))
1472 curr = xas->xa_node;
1473 return curr;
1474}
1475
1476/**
1477 * __xa_erase() - Erase this entry from the XArray while locked.
1478 * @xa: XArray.
1479 * @index: Index into array.
1480 *
Matthew Wilcox809ab932019-01-26 00:52:26 -05001481 * After this function returns, loading from @index will return %NULL.
1482 * If the index is part of a multi-index entry, all indices will be erased
1483 * and none of the entries will be part of a multi-index entry.
Matthew Wilcox58d6ea32017-11-10 15:15:08 -05001484 *
Matthew Wilcox809ab932019-01-26 00:52:26 -05001485 * Context: Any context. Expects xa_lock to be held on entry.
1486 * Return: The entry which used to be at this index.
Matthew Wilcox58d6ea32017-11-10 15:15:08 -05001487 */
1488void *__xa_erase(struct xarray *xa, unsigned long index)
1489{
1490 XA_STATE(xas, xa, index);
1491 return xas_result(&xas, xas_store(&xas, NULL));
1492}
Matthew Wilcox9ee5a3b2018-11-01 22:52:06 -04001493EXPORT_SYMBOL(__xa_erase);
Matthew Wilcox58d6ea32017-11-10 15:15:08 -05001494
1495/**
Matthew Wilcox9c16bb82018-11-05 15:48:49 -05001496 * xa_erase() - Erase this entry from the XArray.
1497 * @xa: XArray.
1498 * @index: Index of entry.
1499 *
Matthew Wilcox809ab932019-01-26 00:52:26 -05001500 * After this function returns, loading from @index will return %NULL.
1501 * If the index is part of a multi-index entry, all indices will be erased
1502 * and none of the entries will be part of a multi-index entry.
Matthew Wilcox9c16bb82018-11-05 15:48:49 -05001503 *
1504 * Context: Any context. Takes and releases the xa_lock.
1505 * Return: The entry which used to be at this index.
1506 */
1507void *xa_erase(struct xarray *xa, unsigned long index)
1508{
1509 void *entry;
1510
1511 xa_lock(xa);
1512 entry = __xa_erase(xa, index);
1513 xa_unlock(xa);
1514
1515 return entry;
1516}
1517EXPORT_SYMBOL(xa_erase);
1518
1519/**
Matthew Wilcox58d6ea32017-11-10 15:15:08 -05001520 * __xa_store() - Store this entry in the XArray.
1521 * @xa: XArray.
1522 * @index: Index into array.
1523 * @entry: New entry.
1524 * @gfp: Memory allocation flags.
1525 *
1526 * You must already be holding the xa_lock when calling this function.
1527 * It will drop the lock if needed to allocate memory, and then reacquire
1528 * it afterwards.
1529 *
1530 * Context: Any context. Expects xa_lock to be held on entry. May
1531 * release and reacquire xa_lock if @gfp flags permit.
1532 * Return: The old entry at this index or xa_err() if an error happened.
1533 */
1534void *__xa_store(struct xarray *xa, unsigned long index, void *entry, gfp_t gfp)
1535{
1536 XA_STATE(xas, xa, index);
1537 void *curr;
1538
Matthew Wilcox76b4e522018-12-28 23:20:44 -05001539 if (WARN_ON_ONCE(xa_is_advanced(entry)))
Matthew Wilcox58d6ea32017-11-10 15:15:08 -05001540 return XA_ERROR(-EINVAL);
Matthew Wilcoxd9c48042018-11-05 16:15:56 -05001541 if (xa_track_free(xa) && !entry)
1542 entry = XA_ZERO_ENTRY;
Matthew Wilcox58d6ea32017-11-10 15:15:08 -05001543
1544 do {
1545 curr = xas_store(&xas, entry);
Matthew Wilcoxd9c48042018-11-05 16:15:56 -05001546 if (xa_track_free(xa))
Matthew Wilcox371c7522018-07-04 10:50:12 -04001547 xas_clear_mark(&xas, XA_FREE_MARK);
Matthew Wilcox58d6ea32017-11-10 15:15:08 -05001548 } while (__xas_nomem(&xas, gfp));
1549
1550 return xas_result(&xas, curr);
1551}
1552EXPORT_SYMBOL(__xa_store);
1553
Matthew Wilcox9b89a032017-11-10 09:34:31 -05001554/**
Matthew Wilcox611f3182018-11-05 15:56:17 -05001555 * xa_store() - Store this entry in the XArray.
1556 * @xa: XArray.
1557 * @index: Index into array.
1558 * @entry: New entry.
1559 * @gfp: Memory allocation flags.
1560 *
1561 * After this function returns, loads from this index will return @entry.
Matthew Wilcox (Oracle)8fc75642020-10-15 20:05:16 -07001562 * Storing into an existing multi-index entry updates the entry of every index.
Matthew Wilcox611f3182018-11-05 15:56:17 -05001563 * The marks associated with @index are unaffected unless @entry is %NULL.
1564 *
1565 * Context: Any context. Takes and releases the xa_lock.
1566 * May sleep if the @gfp flags permit.
1567 * Return: The old entry at this index on success, xa_err(-EINVAL) if @entry
1568 * cannot be stored in an XArray, or xa_err(-ENOMEM) if memory allocation
1569 * failed.
1570 */
1571void *xa_store(struct xarray *xa, unsigned long index, void *entry, gfp_t gfp)
1572{
1573 void *curr;
1574
1575 xa_lock(xa);
1576 curr = __xa_store(xa, index, entry, gfp);
1577 xa_unlock(xa);
1578
1579 return curr;
1580}
1581EXPORT_SYMBOL(xa_store);
1582
1583/**
Matthew Wilcox41aec912017-11-10 15:34:55 -05001584 * __xa_cmpxchg() - Store this entry in the XArray.
1585 * @xa: XArray.
1586 * @index: Index into array.
1587 * @old: Old value to test against.
1588 * @entry: New entry.
1589 * @gfp: Memory allocation flags.
1590 *
1591 * You must already be holding the xa_lock when calling this function.
1592 * It will drop the lock if needed to allocate memory, and then reacquire
1593 * it afterwards.
1594 *
1595 * Context: Any context. Expects xa_lock to be held on entry. May
1596 * release and reacquire xa_lock if @gfp flags permit.
1597 * Return: The old entry at this index or xa_err() if an error happened.
1598 */
1599void *__xa_cmpxchg(struct xarray *xa, unsigned long index,
1600 void *old, void *entry, gfp_t gfp)
1601{
1602 XA_STATE(xas, xa, index);
1603 void *curr;
1604
Matthew Wilcox76b4e522018-12-28 23:20:44 -05001605 if (WARN_ON_ONCE(xa_is_advanced(entry)))
Matthew Wilcox41aec912017-11-10 15:34:55 -05001606 return XA_ERROR(-EINVAL);
1607
1608 do {
1609 curr = xas_load(&xas);
Matthew Wilcox371c7522018-07-04 10:50:12 -04001610 if (curr == old) {
Matthew Wilcox41aec912017-11-10 15:34:55 -05001611 xas_store(&xas, entry);
Matthew Wilcoxb38f6c52019-02-20 11:30:49 -05001612 if (xa_track_free(xa) && entry && !curr)
Matthew Wilcox371c7522018-07-04 10:50:12 -04001613 xas_clear_mark(&xas, XA_FREE_MARK);
1614 }
Matthew Wilcox41aec912017-11-10 15:34:55 -05001615 } while (__xas_nomem(&xas, gfp));
1616
1617 return xas_result(&xas, curr);
1618}
1619EXPORT_SYMBOL(__xa_cmpxchg);
1620
1621/**
Matthew Wilcoxb0606fe2019-01-02 13:57:03 -05001622 * __xa_insert() - Store this entry in the XArray if no entry is present.
1623 * @xa: XArray.
1624 * @index: Index into array.
1625 * @entry: New entry.
1626 * @gfp: Memory allocation flags.
1627 *
1628 * Inserting a NULL entry will store a reserved entry (like xa_reserve())
1629 * if no entry is present. Inserting will fail if a reserved entry is
1630 * present, even though loading from this index will return NULL.
1631 *
1632 * Context: Any context. Expects xa_lock to be held on entry. May
1633 * release and reacquire xa_lock if @gfp flags permit.
Matthew Wilcoxfd9dc932019-02-06 13:07:11 -05001634 * Return: 0 if the store succeeded. -EBUSY if another entry was present.
Matthew Wilcoxb0606fe2019-01-02 13:57:03 -05001635 * -ENOMEM if memory could not be allocated.
1636 */
1637int __xa_insert(struct xarray *xa, unsigned long index, void *entry, gfp_t gfp)
1638{
1639 XA_STATE(xas, xa, index);
1640 void *curr;
1641
1642 if (WARN_ON_ONCE(xa_is_advanced(entry)))
1643 return -EINVAL;
1644 if (!entry)
1645 entry = XA_ZERO_ENTRY;
1646
1647 do {
1648 curr = xas_load(&xas);
1649 if (!curr) {
1650 xas_store(&xas, entry);
1651 if (xa_track_free(xa))
1652 xas_clear_mark(&xas, XA_FREE_MARK);
1653 } else {
Matthew Wilcoxfd9dc932019-02-06 13:07:11 -05001654 xas_set_err(&xas, -EBUSY);
Matthew Wilcoxb0606fe2019-01-02 13:57:03 -05001655 }
1656 } while (__xas_nomem(&xas, gfp));
1657
1658 return xas_error(&xas);
1659}
1660EXPORT_SYMBOL(__xa_insert);
1661
Matthew Wilcox0e9446c2018-08-15 14:13:29 -04001662#ifdef CONFIG_XARRAY_MULTI
1663static void xas_set_range(struct xa_state *xas, unsigned long first,
1664 unsigned long last)
1665{
1666 unsigned int shift = 0;
1667 unsigned long sibs = last - first;
1668 unsigned int offset = XA_CHUNK_MASK;
1669
1670 xas_set(xas, first);
1671
1672 while ((first & XA_CHUNK_MASK) == 0) {
1673 if (sibs < XA_CHUNK_MASK)
1674 break;
1675 if ((sibs == XA_CHUNK_MASK) && (offset < XA_CHUNK_MASK))
1676 break;
1677 shift += XA_CHUNK_SHIFT;
1678 if (offset == XA_CHUNK_MASK)
1679 offset = sibs & XA_CHUNK_MASK;
1680 sibs >>= XA_CHUNK_SHIFT;
1681 first >>= XA_CHUNK_SHIFT;
1682 }
1683
1684 offset = first & XA_CHUNK_MASK;
1685 if (offset + sibs > XA_CHUNK_MASK)
1686 sibs = XA_CHUNK_MASK - offset;
1687 if ((((first + sibs + 1) << shift) - 1) > last)
1688 sibs -= 1;
1689
1690 xas->xa_shift = shift;
1691 xas->xa_sibs = sibs;
1692}
1693
1694/**
1695 * xa_store_range() - Store this entry at a range of indices in the XArray.
1696 * @xa: XArray.
1697 * @first: First index to affect.
1698 * @last: Last index to affect.
1699 * @entry: New entry.
1700 * @gfp: Memory allocation flags.
1701 *
1702 * After this function returns, loads from any index between @first and @last,
1703 * inclusive will return @entry.
Matthew Wilcox (Oracle)8fc75642020-10-15 20:05:16 -07001704 * Storing into an existing multi-index entry updates the entry of every index.
Matthew Wilcox0e9446c2018-08-15 14:13:29 -04001705 * The marks associated with @index are unaffected unless @entry is %NULL.
1706 *
1707 * Context: Process context. Takes and releases the xa_lock. May sleep
1708 * if the @gfp flags permit.
1709 * Return: %NULL on success, xa_err(-EINVAL) if @entry cannot be stored in
1710 * an XArray, or xa_err(-ENOMEM) if memory allocation failed.
1711 */
1712void *xa_store_range(struct xarray *xa, unsigned long first,
1713 unsigned long last, void *entry, gfp_t gfp)
1714{
1715 XA_STATE(xas, xa, 0);
1716
1717 if (WARN_ON_ONCE(xa_is_internal(entry)))
1718 return XA_ERROR(-EINVAL);
1719 if (last < first)
1720 return XA_ERROR(-EINVAL);
1721
1722 do {
1723 xas_lock(&xas);
1724 if (entry) {
Matthew Wilcox44a4a662018-11-05 10:53:09 -05001725 unsigned int order = BITS_PER_LONG;
1726 if (last + 1)
1727 order = __ffs(last + 1);
Matthew Wilcox0e9446c2018-08-15 14:13:29 -04001728 xas_set_order(&xas, last, order);
Matthew Wilcox76b4e522018-12-28 23:20:44 -05001729 xas_create(&xas, true);
Matthew Wilcox0e9446c2018-08-15 14:13:29 -04001730 if (xas_error(&xas))
1731 goto unlock;
1732 }
1733 do {
1734 xas_set_range(&xas, first, last);
1735 xas_store(&xas, entry);
1736 if (xas_error(&xas))
1737 goto unlock;
1738 first += xas_size(&xas);
1739 } while (first <= last);
1740unlock:
1741 xas_unlock(&xas);
1742 } while (xas_nomem(&xas, gfp));
1743
1744 return xas_result(&xas, NULL);
1745}
1746EXPORT_SYMBOL(xa_store_range);
Matthew Wilcox (Oracle)57417ce2020-10-15 20:05:13 -07001747
1748/**
1749 * xa_get_order() - Get the order of an entry.
1750 * @xa: XArray.
1751 * @index: Index of the entry.
1752 *
1753 * Return: A number between 0 and 63 indicating the order of the entry.
1754 */
1755int xa_get_order(struct xarray *xa, unsigned long index)
1756{
1757 XA_STATE(xas, xa, index);
1758 void *entry;
1759 int order = 0;
1760
1761 rcu_read_lock();
1762 entry = xas_load(&xas);
1763
1764 if (!entry)
1765 goto unlock;
1766
1767 if (!xas.xa_node)
1768 goto unlock;
1769
1770 for (;;) {
1771 unsigned int slot = xas.xa_offset + (1 << order);
1772
1773 if (slot >= XA_CHUNK_SIZE)
1774 break;
1775 if (!xa_is_sibling(xas.xa_node->slots[slot]))
1776 break;
1777 order++;
1778 }
1779
1780 order += xas.xa_node->shift;
1781unlock:
1782 rcu_read_unlock();
1783
1784 return order;
1785}
1786EXPORT_SYMBOL(xa_get_order);
Matthew Wilcox0e9446c2018-08-15 14:13:29 -04001787#endif /* CONFIG_XARRAY_MULTI */
1788
Matthew Wilcox9f14d4f2018-10-01 14:54:59 -04001789/**
Matthew Wilcox371c7522018-07-04 10:50:12 -04001790 * __xa_alloc() - Find somewhere to store this entry in the XArray.
1791 * @xa: XArray.
1792 * @id: Pointer to ID.
Matthew Wilcoxa3e4d3f2018-12-31 10:41:01 -05001793 * @limit: Range for allocated ID.
Matthew Wilcox371c7522018-07-04 10:50:12 -04001794 * @entry: New entry.
1795 * @gfp: Memory allocation flags.
1796 *
Matthew Wilcoxa3e4d3f2018-12-31 10:41:01 -05001797 * Finds an empty entry in @xa between @limit.min and @limit.max,
1798 * stores the index into the @id pointer, then stores the entry at
1799 * that index. A concurrent lookup will not see an uninitialised @id.
Matthew Wilcox371c7522018-07-04 10:50:12 -04001800 *
1801 * Context: Any context. Expects xa_lock to be held on entry. May
1802 * release and reacquire xa_lock if @gfp flags permit.
Matthew Wilcoxa3e4d3f2018-12-31 10:41:01 -05001803 * Return: 0 on success, -ENOMEM if memory could not be allocated or
1804 * -EBUSY if there are no free entries in @limit.
Matthew Wilcox371c7522018-07-04 10:50:12 -04001805 */
Matthew Wilcoxa3e4d3f2018-12-31 10:41:01 -05001806int __xa_alloc(struct xarray *xa, u32 *id, void *entry,
1807 struct xa_limit limit, gfp_t gfp)
Matthew Wilcox371c7522018-07-04 10:50:12 -04001808{
1809 XA_STATE(xas, xa, 0);
Matthew Wilcox371c7522018-07-04 10:50:12 -04001810
Matthew Wilcox76b4e522018-12-28 23:20:44 -05001811 if (WARN_ON_ONCE(xa_is_advanced(entry)))
Matthew Wilcox371c7522018-07-04 10:50:12 -04001812 return -EINVAL;
1813 if (WARN_ON_ONCE(!xa_track_free(xa)))
1814 return -EINVAL;
1815
1816 if (!entry)
1817 entry = XA_ZERO_ENTRY;
1818
1819 do {
Matthew Wilcoxa3e4d3f2018-12-31 10:41:01 -05001820 xas.xa_index = limit.min;
1821 xas_find_marked(&xas, limit.max, XA_FREE_MARK);
Matthew Wilcox371c7522018-07-04 10:50:12 -04001822 if (xas.xa_node == XAS_RESTART)
Matthew Wilcoxa3e4d3f2018-12-31 10:41:01 -05001823 xas_set_err(&xas, -EBUSY);
1824 else
1825 *id = xas.xa_index;
Matthew Wilcox371c7522018-07-04 10:50:12 -04001826 xas_store(&xas, entry);
1827 xas_clear_mark(&xas, XA_FREE_MARK);
1828 } while (__xas_nomem(&xas, gfp));
1829
Matthew Wilcoxa3e4d3f2018-12-31 10:41:01 -05001830 return xas_error(&xas);
Matthew Wilcox371c7522018-07-04 10:50:12 -04001831}
1832EXPORT_SYMBOL(__xa_alloc);
1833
1834/**
Matthew Wilcox2fa044e2018-11-06 14:13:35 -05001835 * __xa_alloc_cyclic() - Find somewhere to store this entry in the XArray.
1836 * @xa: XArray.
1837 * @id: Pointer to ID.
1838 * @entry: New entry.
1839 * @limit: Range of allocated ID.
1840 * @next: Pointer to next ID to allocate.
1841 * @gfp: Memory allocation flags.
1842 *
1843 * Finds an empty entry in @xa between @limit.min and @limit.max,
1844 * stores the index into the @id pointer, then stores the entry at
1845 * that index. A concurrent lookup will not see an uninitialised @id.
1846 * The search for an empty entry will start at @next and will wrap
1847 * around if necessary.
1848 *
1849 * Context: Any context. Expects xa_lock to be held on entry. May
1850 * release and reacquire xa_lock if @gfp flags permit.
1851 * Return: 0 if the allocation succeeded without wrapping. 1 if the
1852 * allocation succeeded after wrapping, -ENOMEM if memory could not be
1853 * allocated or -EBUSY if there are no free entries in @limit.
1854 */
1855int __xa_alloc_cyclic(struct xarray *xa, u32 *id, void *entry,
1856 struct xa_limit limit, u32 *next, gfp_t gfp)
1857{
1858 u32 min = limit.min;
1859 int ret;
1860
1861 limit.min = max(min, *next);
1862 ret = __xa_alloc(xa, id, entry, limit, gfp);
1863 if ((xa->xa_flags & XA_FLAGS_ALLOC_WRAPPED) && ret == 0) {
1864 xa->xa_flags &= ~XA_FLAGS_ALLOC_WRAPPED;
1865 ret = 1;
1866 }
1867
1868 if (ret < 0 && limit.min > min) {
1869 limit.min = min;
1870 ret = __xa_alloc(xa, id, entry, limit, gfp);
1871 if (ret == 0)
1872 ret = 1;
1873 }
1874
1875 if (ret >= 0) {
1876 *next = *id + 1;
1877 if (*next == 0)
1878 xa->xa_flags |= XA_FLAGS_ALLOC_WRAPPED;
1879 }
1880 return ret;
1881}
1882EXPORT_SYMBOL(__xa_alloc_cyclic);
1883
1884/**
Matthew Wilcox9b89a032017-11-10 09:34:31 -05001885 * __xa_set_mark() - Set this mark on this entry while locked.
1886 * @xa: XArray.
1887 * @index: Index of entry.
1888 * @mark: Mark number.
1889 *
Matthew Wilcox804dfaf2018-11-05 16:37:15 -05001890 * Attempting to set a mark on a %NULL entry does not succeed.
Matthew Wilcox9b89a032017-11-10 09:34:31 -05001891 *
1892 * Context: Any context. Expects xa_lock to be held on entry.
1893 */
1894void __xa_set_mark(struct xarray *xa, unsigned long index, xa_mark_t mark)
1895{
1896 XA_STATE(xas, xa, index);
1897 void *entry = xas_load(&xas);
1898
1899 if (entry)
1900 xas_set_mark(&xas, mark);
1901}
Matthew Wilcox9ee5a3b2018-11-01 22:52:06 -04001902EXPORT_SYMBOL(__xa_set_mark);
Matthew Wilcox9b89a032017-11-10 09:34:31 -05001903
1904/**
1905 * __xa_clear_mark() - Clear this mark on this entry while locked.
1906 * @xa: XArray.
1907 * @index: Index of entry.
1908 * @mark: Mark number.
1909 *
1910 * Context: Any context. Expects xa_lock to be held on entry.
1911 */
1912void __xa_clear_mark(struct xarray *xa, unsigned long index, xa_mark_t mark)
1913{
1914 XA_STATE(xas, xa, index);
1915 void *entry = xas_load(&xas);
1916
1917 if (entry)
1918 xas_clear_mark(&xas, mark);
1919}
Matthew Wilcox9ee5a3b2018-11-01 22:52:06 -04001920EXPORT_SYMBOL(__xa_clear_mark);
Matthew Wilcox9b89a032017-11-10 09:34:31 -05001921
1922/**
1923 * xa_get_mark() - Inquire whether this mark is set on this entry.
1924 * @xa: XArray.
1925 * @index: Index of entry.
1926 * @mark: Mark number.
1927 *
1928 * This function uses the RCU read lock, so the result may be out of date
1929 * by the time it returns. If you need the result to be stable, use a lock.
1930 *
1931 * Context: Any context. Takes and releases the RCU lock.
1932 * Return: True if the entry at @index has this mark set, false if it doesn't.
1933 */
1934bool xa_get_mark(struct xarray *xa, unsigned long index, xa_mark_t mark)
1935{
1936 XA_STATE(xas, xa, index);
1937 void *entry;
1938
1939 rcu_read_lock();
1940 entry = xas_start(&xas);
1941 while (xas_get_mark(&xas, mark)) {
1942 if (!xa_is_node(entry))
1943 goto found;
1944 entry = xas_descend(&xas, xa_to_node(entry));
1945 }
1946 rcu_read_unlock();
1947 return false;
1948 found:
1949 rcu_read_unlock();
1950 return true;
1951}
1952EXPORT_SYMBOL(xa_get_mark);
1953
1954/**
1955 * xa_set_mark() - Set this mark on this entry.
1956 * @xa: XArray.
1957 * @index: Index of entry.
1958 * @mark: Mark number.
1959 *
Matthew Wilcox804dfaf2018-11-05 16:37:15 -05001960 * Attempting to set a mark on a %NULL entry does not succeed.
Matthew Wilcox9b89a032017-11-10 09:34:31 -05001961 *
1962 * Context: Process context. Takes and releases the xa_lock.
1963 */
1964void xa_set_mark(struct xarray *xa, unsigned long index, xa_mark_t mark)
1965{
1966 xa_lock(xa);
1967 __xa_set_mark(xa, index, mark);
1968 xa_unlock(xa);
1969}
1970EXPORT_SYMBOL(xa_set_mark);
1971
1972/**
1973 * xa_clear_mark() - Clear this mark on this entry.
1974 * @xa: XArray.
1975 * @index: Index of entry.
1976 * @mark: Mark number.
1977 *
1978 * Clearing a mark always succeeds.
1979 *
1980 * Context: Process context. Takes and releases the xa_lock.
1981 */
1982void xa_clear_mark(struct xarray *xa, unsigned long index, xa_mark_t mark)
1983{
1984 xa_lock(xa);
1985 __xa_clear_mark(xa, index, mark);
1986 xa_unlock(xa);
1987}
1988EXPORT_SYMBOL(xa_clear_mark);
1989
Matthew Wilcoxb803b422017-11-14 08:30:11 -05001990/**
1991 * xa_find() - Search the XArray for an entry.
1992 * @xa: XArray.
1993 * @indexp: Pointer to an index.
1994 * @max: Maximum index to search to.
1995 * @filter: Selection criterion.
1996 *
1997 * Finds the entry in @xa which matches the @filter, and has the lowest
1998 * index that is at least @indexp and no more than @max.
1999 * If an entry is found, @indexp is updated to be the index of the entry.
2000 * This function is protected by the RCU read lock, so it may not find
2001 * entries which are being simultaneously added. It will not return an
2002 * %XA_RETRY_ENTRY; if you need to see retry entries, use xas_find().
2003 *
2004 * Context: Any context. Takes and releases the RCU lock.
2005 * Return: The entry, if found, otherwise %NULL.
2006 */
2007void *xa_find(struct xarray *xa, unsigned long *indexp,
2008 unsigned long max, xa_mark_t filter)
2009{
2010 XA_STATE(xas, xa, *indexp);
2011 void *entry;
2012
2013 rcu_read_lock();
2014 do {
2015 if ((__force unsigned int)filter < XA_MAX_MARKS)
2016 entry = xas_find_marked(&xas, max, filter);
2017 else
2018 entry = xas_find(&xas, max);
2019 } while (xas_retry(&xas, entry));
2020 rcu_read_unlock();
2021
2022 if (entry)
2023 *indexp = xas.xa_index;
2024 return entry;
2025}
2026EXPORT_SYMBOL(xa_find);
2027
Matthew Wilcox (Oracle)19c30f42020-01-17 22:00:41 -05002028static bool xas_sibling(struct xa_state *xas)
2029{
2030 struct xa_node *node = xas->xa_node;
2031 unsigned long mask;
2032
Matthew Wilcox (Oracle)d8e93e32020-02-27 07:37:40 -05002033 if (!IS_ENABLED(CONFIG_XARRAY_MULTI) || !node)
Matthew Wilcox (Oracle)19c30f42020-01-17 22:00:41 -05002034 return false;
2035 mask = (XA_CHUNK_SIZE << node->shift) - 1;
Matthew Wilcox (Oracle)bd40b172020-01-31 05:07:55 -05002036 return (xas->xa_index & mask) >
2037 ((unsigned long)xas->xa_offset << node->shift);
Matthew Wilcox (Oracle)19c30f42020-01-17 22:00:41 -05002038}
2039
Matthew Wilcoxb803b422017-11-14 08:30:11 -05002040/**
2041 * xa_find_after() - Search the XArray for a present entry.
2042 * @xa: XArray.
2043 * @indexp: Pointer to an index.
2044 * @max: Maximum index to search to.
2045 * @filter: Selection criterion.
2046 *
2047 * Finds the entry in @xa which matches the @filter and has the lowest
2048 * index that is above @indexp and no more than @max.
2049 * If an entry is found, @indexp is updated to be the index of the entry.
2050 * This function is protected by the RCU read lock, so it may miss entries
2051 * which are being simultaneously added. It will not return an
2052 * %XA_RETRY_ENTRY; if you need to see retry entries, use xas_find().
2053 *
2054 * Context: Any context. Takes and releases the RCU lock.
2055 * Return: The pointer, if found, otherwise %NULL.
2056 */
2057void *xa_find_after(struct xarray *xa, unsigned long *indexp,
2058 unsigned long max, xa_mark_t filter)
2059{
2060 XA_STATE(xas, xa, *indexp + 1);
2061 void *entry;
2062
Matthew Wilcox (Oracle)430f24f2020-01-17 17:45:12 -05002063 if (xas.xa_index == 0)
2064 return NULL;
2065
Matthew Wilcoxb803b422017-11-14 08:30:11 -05002066 rcu_read_lock();
2067 for (;;) {
2068 if ((__force unsigned int)filter < XA_MAX_MARKS)
2069 entry = xas_find_marked(&xas, max, filter);
2070 else
2071 entry = xas_find(&xas, max);
Matthew Wilcox (Oracle)c44aa5e2020-01-17 22:13:21 -05002072
2073 if (xas_invalid(&xas))
Matthew Wilcox8229706e2018-11-01 16:55:19 -04002074 break;
Matthew Wilcox (Oracle)19c30f42020-01-17 22:00:41 -05002075 if (xas_sibling(&xas))
2076 continue;
Matthew Wilcoxb803b422017-11-14 08:30:11 -05002077 if (!xas_retry(&xas, entry))
2078 break;
2079 }
2080 rcu_read_unlock();
2081
2082 if (entry)
2083 *indexp = xas.xa_index;
2084 return entry;
2085}
2086EXPORT_SYMBOL(xa_find_after);
2087
Matthew Wilcox80a0a1a2017-11-14 16:42:22 -05002088static unsigned int xas_extract_present(struct xa_state *xas, void **dst,
2089 unsigned long max, unsigned int n)
2090{
2091 void *entry;
2092 unsigned int i = 0;
2093
2094 rcu_read_lock();
2095 xas_for_each(xas, entry, max) {
2096 if (xas_retry(xas, entry))
2097 continue;
2098 dst[i++] = entry;
2099 if (i == n)
2100 break;
2101 }
2102 rcu_read_unlock();
2103
2104 return i;
2105}
2106
2107static unsigned int xas_extract_marked(struct xa_state *xas, void **dst,
2108 unsigned long max, unsigned int n, xa_mark_t mark)
2109{
2110 void *entry;
2111 unsigned int i = 0;
2112
2113 rcu_read_lock();
2114 xas_for_each_marked(xas, entry, max, mark) {
2115 if (xas_retry(xas, entry))
2116 continue;
2117 dst[i++] = entry;
2118 if (i == n)
2119 break;
2120 }
2121 rcu_read_unlock();
2122
2123 return i;
2124}
2125
2126/**
2127 * xa_extract() - Copy selected entries from the XArray into a normal array.
2128 * @xa: The source XArray to copy from.
2129 * @dst: The buffer to copy entries into.
2130 * @start: The first index in the XArray eligible to be selected.
2131 * @max: The last index in the XArray eligible to be selected.
2132 * @n: The maximum number of entries to copy.
2133 * @filter: Selection criterion.
2134 *
2135 * Copies up to @n entries that match @filter from the XArray. The
2136 * copied entries will have indices between @start and @max, inclusive.
2137 *
2138 * The @filter may be an XArray mark value, in which case entries which are
2139 * marked with that mark will be copied. It may also be %XA_PRESENT, in
Matthew Wilcox804dfaf2018-11-05 16:37:15 -05002140 * which case all entries which are not %NULL will be copied.
Matthew Wilcox80a0a1a2017-11-14 16:42:22 -05002141 *
2142 * The entries returned may not represent a snapshot of the XArray at a
2143 * moment in time. For example, if another thread stores to index 5, then
2144 * index 10, calling xa_extract() may return the old contents of index 5
2145 * and the new contents of index 10. Indices not modified while this
2146 * function is running will not be skipped.
2147 *
2148 * If you need stronger guarantees, holding the xa_lock across calls to this
2149 * function will prevent concurrent modification.
2150 *
2151 * Context: Any context. Takes and releases the RCU lock.
2152 * Return: The number of entries copied.
2153 */
2154unsigned int xa_extract(struct xarray *xa, void **dst, unsigned long start,
2155 unsigned long max, unsigned int n, xa_mark_t filter)
2156{
2157 XA_STATE(xas, xa, start);
2158
2159 if (!n)
2160 return 0;
2161
2162 if ((__force unsigned int)filter < XA_MAX_MARKS)
2163 return xas_extract_marked(&xas, dst, max, n, filter);
2164 return xas_extract_present(&xas, dst, max, n);
2165}
2166EXPORT_SYMBOL(xa_extract);
2167
Matthew Wilcox687149f2017-11-17 08:16:34 -05002168/**
Matthew Wilcox (Oracle)f82cd2f2020-08-18 09:05:56 -04002169 * xa_delete_node() - Private interface for workingset code.
2170 * @node: Node to be removed from the tree.
2171 * @update: Function to call to update ancestor nodes.
2172 *
2173 * Context: xa_lock must be held on entry and will not be released.
2174 */
2175void xa_delete_node(struct xa_node *node, xa_update_node_t update)
2176{
2177 struct xa_state xas = {
2178 .xa = node->array,
2179 .xa_index = (unsigned long)node->offset <<
2180 (node->shift + XA_CHUNK_SHIFT),
2181 .xa_shift = node->shift + XA_CHUNK_SHIFT,
2182 .xa_offset = node->offset,
2183 .xa_node = xa_parent_locked(node->array, node),
2184 .xa_update = update,
2185 };
2186
2187 xas_store(&xas, NULL);
2188}
2189EXPORT_SYMBOL_GPL(xa_delete_node); /* For the benefit of the test suite */
2190
2191/**
Matthew Wilcox687149f2017-11-17 08:16:34 -05002192 * xa_destroy() - Free all internal data structures.
2193 * @xa: XArray.
2194 *
2195 * After calling this function, the XArray is empty and has freed all memory
2196 * allocated for its internal data structures. You are responsible for
2197 * freeing the objects referenced by the XArray.
2198 *
2199 * Context: Any context. Takes and releases the xa_lock, interrupt-safe.
2200 */
2201void xa_destroy(struct xarray *xa)
2202{
2203 XA_STATE(xas, xa, 0);
2204 unsigned long flags;
2205 void *entry;
2206
2207 xas.xa_node = NULL;
2208 xas_lock_irqsave(&xas, flags);
2209 entry = xa_head_locked(xa);
2210 RCU_INIT_POINTER(xa->xa_head, NULL);
2211 xas_init_marks(&xas);
Matthew Wilcox3ccaf572018-10-26 14:43:22 -04002212 if (xa_zero_busy(xa))
2213 xa_mark_clear(xa, XA_FREE_MARK);
Matthew Wilcox687149f2017-11-17 08:16:34 -05002214 /* lockdep checks we're still holding the lock in xas_free_nodes() */
2215 if (xa_is_node(entry))
2216 xas_free_nodes(&xas, xa_to_node(entry));
2217 xas_unlock_irqrestore(&xas, flags);
2218}
2219EXPORT_SYMBOL(xa_destroy);
2220
Matthew Wilcoxad3d6c72017-11-07 14:57:46 -05002221#ifdef XA_DEBUG
2222void xa_dump_node(const struct xa_node *node)
2223{
2224 unsigned i, j;
2225
2226 if (!node)
2227 return;
2228 if ((unsigned long)node & 3) {
2229 pr_cont("node %px\n", node);
2230 return;
2231 }
2232
2233 pr_cont("node %px %s %d parent %px shift %d count %d values %d "
2234 "array %px list %px %px marks",
2235 node, node->parent ? "offset" : "max", node->offset,
2236 node->parent, node->shift, node->count, node->nr_values,
2237 node->array, node->private_list.prev, node->private_list.next);
2238 for (i = 0; i < XA_MAX_MARKS; i++)
2239 for (j = 0; j < XA_MARK_LONGS; j++)
2240 pr_cont(" %lx", node->marks[i][j]);
2241 pr_cont("\n");
2242}
2243
2244void xa_dump_index(unsigned long index, unsigned int shift)
2245{
2246 if (!shift)
2247 pr_info("%lu: ", index);
2248 else if (shift >= BITS_PER_LONG)
2249 pr_info("0-%lu: ", ~0UL);
2250 else
2251 pr_info("%lu-%lu: ", index, index | ((1UL << shift) - 1));
2252}
2253
2254void xa_dump_entry(const void *entry, unsigned long index, unsigned long shift)
2255{
2256 if (!entry)
2257 return;
2258
2259 xa_dump_index(index, shift);
2260
2261 if (xa_is_node(entry)) {
2262 if (shift == 0) {
2263 pr_cont("%px\n", entry);
2264 } else {
2265 unsigned long i;
2266 struct xa_node *node = xa_to_node(entry);
2267 xa_dump_node(node);
2268 for (i = 0; i < XA_CHUNK_SIZE; i++)
2269 xa_dump_entry(node->slots[i],
2270 index + (i << node->shift), node->shift);
2271 }
2272 } else if (xa_is_value(entry))
2273 pr_cont("value %ld (0x%lx) [%px]\n", xa_to_value(entry),
2274 xa_to_value(entry), entry);
2275 else if (!xa_is_internal(entry))
2276 pr_cont("%px\n", entry);
2277 else if (xa_is_retry(entry))
2278 pr_cont("retry (%ld)\n", xa_to_internal(entry));
2279 else if (xa_is_sibling(entry))
2280 pr_cont("sibling (slot %ld)\n", xa_to_sibling(entry));
Matthew Wilcox9f14d4f2018-10-01 14:54:59 -04002281 else if (xa_is_zero(entry))
2282 pr_cont("zero (%ld)\n", xa_to_internal(entry));
Matthew Wilcoxad3d6c72017-11-07 14:57:46 -05002283 else
2284 pr_cont("UNKNOWN ENTRY (%px)\n", entry);
2285}
2286
2287void xa_dump(const struct xarray *xa)
2288{
2289 void *entry = xa->xa_head;
2290 unsigned int shift = 0;
2291
2292 pr_info("xarray: %px head %px flags %x marks %d %d %d\n", xa, entry,
Matthew Wilcox9b89a032017-11-10 09:34:31 -05002293 xa->xa_flags, xa_marked(xa, XA_MARK_0),
2294 xa_marked(xa, XA_MARK_1), xa_marked(xa, XA_MARK_2));
Matthew Wilcoxad3d6c72017-11-07 14:57:46 -05002295 if (xa_is_node(entry))
2296 shift = xa_to_node(entry)->shift + XA_CHUNK_SHIFT;
2297 xa_dump_entry(entry, 0, shift);
2298}
2299#endif