xref: /linux-6.15/lib/xarray.c (revision 97db889b)
1 // SPDX-License-Identifier: GPL-2.0+
2 /*
3  * XArray implementation
4  * Copyright (c) 2017-2018 Microsoft Corporation
5  * Copyright (c) 2018-2020 Oracle
6  * Author: Matthew Wilcox <[email protected]>
7  */
8 
9 #include <linux/bitmap.h>
10 #include <linux/export.h>
11 #include <linux/list.h>
12 #include <linux/slab.h>
13 #include <linux/xarray.h>
14 
15 #include "radix-tree.h"
16 
17 /*
18  * Coding conventions in this file:
19  *
20  * @xa is used to refer to the entire xarray.
21  * @xas is the 'xarray operation state'.  It may be either a pointer to
22  * an xa_state, or an xa_state stored on the stack.  This is an unfortunate
23  * ambiguity.
24  * @index is the index of the entry being operated on
25  * @mark is an xa_mark_t; a small number indicating one of the mark bits.
26  * @node refers to an xa_node; usually the primary one being operated on by
27  * this function.
28  * @offset is the index into the slots array inside an xa_node.
29  * @parent refers to the @xa_node closer to the head than @node.
30  * @entry refers to something stored in a slot in the xarray
31  */
32 
33 static inline unsigned int xa_lock_type(const struct xarray *xa)
34 {
35 	return (__force unsigned int)xa->xa_flags & 3;
36 }
37 
38 static inline void xas_lock_type(struct xa_state *xas, unsigned int lock_type)
39 {
40 	if (lock_type == XA_LOCK_IRQ)
41 		xas_lock_irq(xas);
42 	else if (lock_type == XA_LOCK_BH)
43 		xas_lock_bh(xas);
44 	else
45 		xas_lock(xas);
46 }
47 
48 static inline void xas_unlock_type(struct xa_state *xas, unsigned int lock_type)
49 {
50 	if (lock_type == XA_LOCK_IRQ)
51 		xas_unlock_irq(xas);
52 	else if (lock_type == XA_LOCK_BH)
53 		xas_unlock_bh(xas);
54 	else
55 		xas_unlock(xas);
56 }
57 
58 static inline bool xa_track_free(const struct xarray *xa)
59 {
60 	return xa->xa_flags & XA_FLAGS_TRACK_FREE;
61 }
62 
63 static inline bool xa_zero_busy(const struct xarray *xa)
64 {
65 	return xa->xa_flags & XA_FLAGS_ZERO_BUSY;
66 }
67 
68 static inline void xa_mark_set(struct xarray *xa, xa_mark_t mark)
69 {
70 	if (!(xa->xa_flags & XA_FLAGS_MARK(mark)))
71 		xa->xa_flags |= XA_FLAGS_MARK(mark);
72 }
73 
74 static inline void xa_mark_clear(struct xarray *xa, xa_mark_t mark)
75 {
76 	if (xa->xa_flags & XA_FLAGS_MARK(mark))
77 		xa->xa_flags &= ~(XA_FLAGS_MARK(mark));
78 }
79 
80 static inline unsigned long *node_marks(struct xa_node *node, xa_mark_t mark)
81 {
82 	return node->marks[(__force unsigned)mark];
83 }
84 
85 static inline bool node_get_mark(struct xa_node *node,
86 		unsigned int offset, xa_mark_t mark)
87 {
88 	return test_bit(offset, node_marks(node, mark));
89 }
90 
91 /* returns true if the bit was set */
92 static inline bool node_set_mark(struct xa_node *node, unsigned int offset,
93 				xa_mark_t mark)
94 {
95 	return __test_and_set_bit(offset, node_marks(node, mark));
96 }
97 
98 /* returns true if the bit was set */
99 static inline bool node_clear_mark(struct xa_node *node, unsigned int offset,
100 				xa_mark_t mark)
101 {
102 	return __test_and_clear_bit(offset, node_marks(node, mark));
103 }
104 
105 static inline bool node_any_mark(struct xa_node *node, xa_mark_t mark)
106 {
107 	return !bitmap_empty(node_marks(node, mark), XA_CHUNK_SIZE);
108 }
109 
110 static inline void node_mark_all(struct xa_node *node, xa_mark_t mark)
111 {
112 	bitmap_fill(node_marks(node, mark), XA_CHUNK_SIZE);
113 }
114 
/*
 * Advance @mark to the next mark number.  The arithmetic is done on a
 * plain unsigned value and cast back, with __force on both casts.
 */
#define mark_inc(mark)							\
do {									\
	(mark) = (__force xa_mark_t)((__force unsigned)(mark) + 1);	\
} while (0)
118 
119 /*
120  * xas_squash_marks() - Merge all marks to the first entry
121  * @xas: Array operation state.
122  *
123  * Set a mark on the first entry if any entry has it set.  Clear marks on
124  * all sibling entries.
125  */
126 static void xas_squash_marks(const struct xa_state *xas)
127 {
128 	unsigned int mark = 0;
129 	unsigned int limit = xas->xa_offset + xas->xa_sibs + 1;
130 
131 	if (!xas->xa_sibs)
132 		return;
133 
134 	do {
135 		unsigned long *marks = xas->xa_node->marks[mark];
136 		if (find_next_bit(marks, limit, xas->xa_offset + 1) == limit)
137 			continue;
138 		__set_bit(xas->xa_offset, marks);
139 		bitmap_clear(marks, xas->xa_offset + 1, xas->xa_sibs);
140 	} while (mark++ != (__force unsigned)XA_MARK_MAX);
141 }
142 
143 /* extracts the offset within this node from the index */
144 static unsigned int get_offset(unsigned long index, struct xa_node *node)
145 {
146 	return (index >> node->shift) & XA_CHUNK_MASK;
147 }
148 
149 static void xas_set_offset(struct xa_state *xas)
150 {
151 	xas->xa_offset = get_offset(xas->xa_index, xas->xa_node);
152 }
153 
154 /* move the index either forwards (find) or backwards (sibling slot) */
155 static void xas_move_index(struct xa_state *xas, unsigned long offset)
156 {
157 	unsigned int shift = xas->xa_node->shift;
158 	xas->xa_index &= ~XA_CHUNK_MASK << shift;
159 	xas->xa_index += offset << shift;
160 }
161 
162 static void xas_next_offset(struct xa_state *xas)
163 {
164 	xas->xa_offset++;
165 	xas_move_index(xas, xas->xa_offset);
166 }
167 
168 static void *set_bounds(struct xa_state *xas)
169 {
170 	xas->xa_node = XAS_BOUNDS;
171 	return NULL;
172 }
173 
174 /*
175  * Starts a walk.  If the @xas is already valid, we assume that it's on
176  * the right path and just return where we've got to.  If we're in an
177  * error state, return NULL.  If the index is outside the current scope
178  * of the xarray, return NULL without changing @xas->xa_node.  Otherwise
179  * set @xas->xa_node to NULL and return the current head of the array.
180  */
181 static void *xas_start(struct xa_state *xas)
182 {
183 	void *entry;
184 
185 	if (xas_valid(xas))
186 		return xas_reload(xas);
187 	if (xas_error(xas))
188 		return NULL;
189 
190 	entry = xa_head(xas->xa);
191 	if (!xa_is_node(entry)) {
192 		if (xas->xa_index)
193 			return set_bounds(xas);
194 	} else {
195 		if ((xas->xa_index >> xa_to_node(entry)->shift) > XA_CHUNK_MASK)
196 			return set_bounds(xas);
197 	}
198 
199 	xas->xa_node = NULL;
200 	return entry;
201 }
202 
203 static __always_inline void *xas_descend(struct xa_state *xas,
204 					struct xa_node *node)
205 {
206 	unsigned int offset = get_offset(xas->xa_index, node);
207 	void *entry = xa_entry(xas->xa, node, offset);
208 
209 	xas->xa_node = node;
210 	while (xa_is_sibling(entry)) {
211 		offset = xa_to_sibling(entry);
212 		entry = xa_entry(xas->xa, node, offset);
213 		if (node->shift && xa_is_node(entry))
214 			entry = XA_RETRY_ENTRY;
215 	}
216 
217 	xas->xa_offset = offset;
218 	return entry;
219 }
220 
221 /**
222  * xas_load() - Load an entry from the XArray (advanced).
223  * @xas: XArray operation state.
224  *
225  * Usually walks the @xas to the appropriate state to load the entry
226  * stored at xa_index.  However, it will do nothing and return %NULL if
227  * @xas is in an error state.  xas_load() will never expand the tree.
228  *
229  * If the xa_state is set up to operate on a multi-index entry, xas_load()
230  * may return %NULL or an internal entry, even if there are entries
231  * present within the range specified by @xas.
232  *
233  * Context: Any context.  The caller should hold the xa_lock or the RCU lock.
234  * Return: Usually an entry in the XArray, but see description for exceptions.
235  */
236 void *xas_load(struct xa_state *xas)
237 {
238 	void *entry = xas_start(xas);
239 
240 	while (xa_is_node(entry)) {
241 		struct xa_node *node = xa_to_node(entry);
242 
243 		if (xas->xa_shift > node->shift)
244 			break;
245 		entry = xas_descend(xas, node);
246 		if (node->shift == 0)
247 			break;
248 	}
249 	return entry;
250 }
251 EXPORT_SYMBOL_GPL(xas_load);
252 
253 #define XA_RCU_FREE	((struct xarray *)1)
254 
255 static void xa_node_free(struct xa_node *node)
256 {
257 	XA_NODE_BUG_ON(node, !list_empty(&node->private_list));
258 	node->array = XA_RCU_FREE;
259 	call_rcu(&node->rcu_head, radix_tree_node_rcu_free);
260 }
261 
262 /*
263  * xas_destroy() - Free any resources allocated during the XArray operation.
264  * @xas: XArray operation state.
265  *
266  * Most users will not need to call this function; it is called for you
267  * by xas_nomem().
268  */
269 void xas_destroy(struct xa_state *xas)
270 {
271 	struct xa_node *next, *node = xas->xa_alloc;
272 
273 	while (node) {
274 		XA_NODE_BUG_ON(node, !list_empty(&node->private_list));
275 		next = rcu_dereference_raw(node->parent);
276 		radix_tree_node_rcu_free(&node->rcu_head);
277 		xas->xa_alloc = node = next;
278 	}
279 }
280 
281 /**
282  * xas_nomem() - Allocate memory if needed.
283  * @xas: XArray operation state.
284  * @gfp: Memory allocation flags.
285  *
286  * If we need to add new nodes to the XArray, we try to allocate memory
287  * with GFP_NOWAIT while holding the lock, which will usually succeed.
288  * If it fails, @xas is flagged as needing memory to continue.  The caller
289  * should drop the lock and call xas_nomem().  If xas_nomem() succeeds,
290  * the caller should retry the operation.
291  *
292  * Forward progress is guaranteed as one node is allocated here and
293  * stored in the xa_state where it will be found by xas_alloc().  More
294  * nodes will likely be found in the slab allocator, but we do not tie
295  * them up here.
296  *
297  * Return: true if memory was needed, and was successfully allocated.
298  */
299 bool xas_nomem(struct xa_state *xas, gfp_t gfp)
300 {
301 	if (xas->xa_node != XA_ERROR(-ENOMEM)) {
302 		xas_destroy(xas);
303 		return false;
304 	}
305 	if (xas->xa->xa_flags & XA_FLAGS_ACCOUNT)
306 		gfp |= __GFP_ACCOUNT;
307 	xas->xa_alloc = kmem_cache_alloc_lru(radix_tree_node_cachep, xas->xa_lru, gfp);
308 	if (!xas->xa_alloc)
309 		return false;
310 	xas->xa_alloc->parent = NULL;
311 	XA_NODE_BUG_ON(xas->xa_alloc, !list_empty(&xas->xa_alloc->private_list));
312 	xas->xa_node = XAS_RESTART;
313 	return true;
314 }
315 EXPORT_SYMBOL_GPL(xas_nomem);
316 
317 /*
318  * __xas_nomem() - Drop locks and allocate memory if needed.
319  * @xas: XArray operation state.
320  * @gfp: Memory allocation flags.
321  *
322  * Internal variant of xas_nomem().
323  *
324  * Return: true if memory was needed, and was successfully allocated.
325  */
326 static bool __xas_nomem(struct xa_state *xas, gfp_t gfp)
327 	__must_hold(xas->xa->xa_lock)
328 {
329 	unsigned int lock_type = xa_lock_type(xas->xa);
330 
331 	if (xas->xa_node != XA_ERROR(-ENOMEM)) {
332 		xas_destroy(xas);
333 		return false;
334 	}
335 	if (xas->xa->xa_flags & XA_FLAGS_ACCOUNT)
336 		gfp |= __GFP_ACCOUNT;
337 	if (gfpflags_allow_blocking(gfp)) {
338 		xas_unlock_type(xas, lock_type);
339 		xas->xa_alloc = kmem_cache_alloc_lru(radix_tree_node_cachep, xas->xa_lru, gfp);
340 		xas_lock_type(xas, lock_type);
341 	} else {
342 		xas->xa_alloc = kmem_cache_alloc_lru(radix_tree_node_cachep, xas->xa_lru, gfp);
343 	}
344 	if (!xas->xa_alloc)
345 		return false;
346 	xas->xa_alloc->parent = NULL;
347 	XA_NODE_BUG_ON(xas->xa_alloc, !list_empty(&xas->xa_alloc->private_list));
348 	xas->xa_node = XAS_RESTART;
349 	return true;
350 }
351 
352 static void xas_update(struct xa_state *xas, struct xa_node *node)
353 {
354 	if (xas->xa_update)
355 		xas->xa_update(node);
356 	else
357 		XA_NODE_BUG_ON(node, !list_empty(&node->private_list));
358 }
359 
360 static void *xas_alloc(struct xa_state *xas, unsigned int shift)
361 {
362 	struct xa_node *parent = xas->xa_node;
363 	struct xa_node *node = xas->xa_alloc;
364 
365 	if (xas_invalid(xas))
366 		return NULL;
367 
368 	if (node) {
369 		xas->xa_alloc = NULL;
370 	} else {
371 		gfp_t gfp = GFP_NOWAIT | __GFP_NOWARN;
372 
373 		if (xas->xa->xa_flags & XA_FLAGS_ACCOUNT)
374 			gfp |= __GFP_ACCOUNT;
375 
376 		node = kmem_cache_alloc_lru(radix_tree_node_cachep, xas->xa_lru, gfp);
377 		if (!node) {
378 			xas_set_err(xas, -ENOMEM);
379 			return NULL;
380 		}
381 	}
382 
383 	if (parent) {
384 		node->offset = xas->xa_offset;
385 		parent->count++;
386 		XA_NODE_BUG_ON(node, parent->count > XA_CHUNK_SIZE);
387 		xas_update(xas, parent);
388 	}
389 	XA_NODE_BUG_ON(node, shift > BITS_PER_LONG);
390 	XA_NODE_BUG_ON(node, !list_empty(&node->private_list));
391 	node->shift = shift;
392 	node->count = 0;
393 	node->nr_values = 0;
394 	RCU_INIT_POINTER(node->parent, xas->xa_node);
395 	node->array = xas->xa;
396 
397 	return node;
398 }
399 
#ifdef CONFIG_XARRAY_MULTI
/*
 * Returns the number of indices covered by a given xa_state: one slot
 * plus its siblings, each slot spanning 1 << xa_shift indices.
 */
static unsigned long xas_size(const struct xa_state *xas)
{
	unsigned long nr_slots = xas->xa_sibs + 1UL;

	return nr_slots << xas->xa_shift;
}
#endif
407 
408 /*
409  * Use this to calculate the maximum index that will need to be created
410  * in order to add the entry described by @xas.  Because we cannot store a
411  * multi-index entry at index 0, the calculation is a little more complex
412  * than you might expect.
413  */
414 static unsigned long xas_max(struct xa_state *xas)
415 {
416 	unsigned long max = xas->xa_index;
417 
418 #ifdef CONFIG_XARRAY_MULTI
419 	if (xas->xa_shift || xas->xa_sibs) {
420 		unsigned long mask = xas_size(xas) - 1;
421 		max |= mask;
422 		if (mask == max)
423 			max++;
424 	}
425 #endif
426 
427 	return max;
428 }
429 
430 /* The maximum index that can be contained in the array without expanding it */
431 static unsigned long max_index(void *entry)
432 {
433 	if (!xa_is_node(entry))
434 		return 0;
435 	return (XA_CHUNK_SIZE << xa_to_node(entry)->shift) - 1;
436 }
437 
438 static inline void *xa_zero_to_null(void *entry)
439 {
440 	return xa_is_zero(entry) ? NULL : entry;
441 }
442 
443 static void xas_shrink(struct xa_state *xas)
444 {
445 	struct xarray *xa = xas->xa;
446 	struct xa_node *node = xas->xa_node;
447 
448 	for (;;) {
449 		void *entry;
450 
451 		XA_NODE_BUG_ON(node, node->count > XA_CHUNK_SIZE);
452 		if (node->count != 1)
453 			break;
454 		entry = xa_entry_locked(xa, node, 0);
455 		if (!entry)
456 			break;
457 		if (!xa_is_node(entry) && node->shift)
458 			break;
459 		if (xa_zero_busy(xa))
460 			entry = xa_zero_to_null(entry);
461 		xas->xa_node = XAS_BOUNDS;
462 
463 		RCU_INIT_POINTER(xa->xa_head, entry);
464 		if (xa_track_free(xa) && !node_get_mark(node, 0, XA_FREE_MARK))
465 			xa_mark_clear(xa, XA_FREE_MARK);
466 
467 		node->count = 0;
468 		node->nr_values = 0;
469 		if (!xa_is_node(entry))
470 			RCU_INIT_POINTER(node->slots[0], XA_RETRY_ENTRY);
471 		xas_update(xas, node);
472 		xa_node_free(node);
473 		if (!xa_is_node(entry))
474 			break;
475 		node = xa_to_node(entry);
476 		node->parent = NULL;
477 	}
478 }
479 
480 /*
481  * xas_delete_node() - Attempt to delete an xa_node
482  * @xas: Array operation state.
483  *
484  * Attempts to delete the @xas->xa_node.  This will fail if xa->node has
485  * a non-zero reference count.
486  */
487 static void xas_delete_node(struct xa_state *xas)
488 {
489 	struct xa_node *node = xas->xa_node;
490 
491 	for (;;) {
492 		struct xa_node *parent;
493 
494 		XA_NODE_BUG_ON(node, node->count > XA_CHUNK_SIZE);
495 		if (node->count)
496 			break;
497 
498 		parent = xa_parent_locked(xas->xa, node);
499 		xas->xa_node = parent;
500 		xas->xa_offset = node->offset;
501 		xa_node_free(node);
502 
503 		if (!parent) {
504 			xas->xa->xa_head = NULL;
505 			xas->xa_node = XAS_BOUNDS;
506 			return;
507 		}
508 
509 		parent->slots[xas->xa_offset] = NULL;
510 		parent->count--;
511 		XA_NODE_BUG_ON(parent, parent->count > XA_CHUNK_SIZE);
512 		node = parent;
513 		xas_update(xas, node);
514 	}
515 
516 	if (!node->parent)
517 		xas_shrink(xas);
518 }
519 
520 /**
521  * xas_free_nodes() - Free this node and all nodes that it references
522  * @xas: Array operation state.
523  * @top: Node to free
524  *
525  * This node has been removed from the tree.  We must now free it and all
526  * of its subnodes.  There may be RCU walkers with references into the tree,
527  * so we must replace all entries with retry markers.
528  */
529 static void xas_free_nodes(struct xa_state *xas, struct xa_node *top)
530 {
531 	unsigned int offset = 0;
532 	struct xa_node *node = top;
533 
534 	for (;;) {
535 		void *entry = xa_entry_locked(xas->xa, node, offset);
536 
537 		if (node->shift && xa_is_node(entry)) {
538 			node = xa_to_node(entry);
539 			offset = 0;
540 			continue;
541 		}
542 		if (entry)
543 			RCU_INIT_POINTER(node->slots[offset], XA_RETRY_ENTRY);
544 		offset++;
545 		while (offset == XA_CHUNK_SIZE) {
546 			struct xa_node *parent;
547 
548 			parent = xa_parent_locked(xas->xa, node);
549 			offset = node->offset + 1;
550 			node->count = 0;
551 			node->nr_values = 0;
552 			xas_update(xas, node);
553 			xa_node_free(node);
554 			if (node == top)
555 				return;
556 			node = parent;
557 		}
558 	}
559 }
560 
561 /*
562  * xas_expand adds nodes to the head of the tree until it has reached
563  * sufficient height to be able to contain @xas->xa_index
564  */
565 static int xas_expand(struct xa_state *xas, void *head)
566 {
567 	struct xarray *xa = xas->xa;
568 	struct xa_node *node = NULL;
569 	unsigned int shift = 0;
570 	unsigned long max = xas_max(xas);
571 
572 	if (!head) {
573 		if (max == 0)
574 			return 0;
575 		while ((max >> shift) >= XA_CHUNK_SIZE)
576 			shift += XA_CHUNK_SHIFT;
577 		return shift + XA_CHUNK_SHIFT;
578 	} else if (xa_is_node(head)) {
579 		node = xa_to_node(head);
580 		shift = node->shift + XA_CHUNK_SHIFT;
581 	}
582 	xas->xa_node = NULL;
583 
584 	while (max > max_index(head)) {
585 		xa_mark_t mark = 0;
586 
587 		XA_NODE_BUG_ON(node, shift > BITS_PER_LONG);
588 		node = xas_alloc(xas, shift);
589 		if (!node)
590 			return -ENOMEM;
591 
592 		node->count = 1;
593 		if (xa_is_value(head))
594 			node->nr_values = 1;
595 		RCU_INIT_POINTER(node->slots[0], head);
596 
597 		/* Propagate the aggregated mark info to the new child */
598 		for (;;) {
599 			if (xa_track_free(xa) && mark == XA_FREE_MARK) {
600 				node_mark_all(node, XA_FREE_MARK);
601 				if (!xa_marked(xa, XA_FREE_MARK)) {
602 					node_clear_mark(node, 0, XA_FREE_MARK);
603 					xa_mark_set(xa, XA_FREE_MARK);
604 				}
605 			} else if (xa_marked(xa, mark)) {
606 				node_set_mark(node, 0, mark);
607 			}
608 			if (mark == XA_MARK_MAX)
609 				break;
610 			mark_inc(mark);
611 		}
612 
613 		/*
614 		 * Now that the new node is fully initialised, we can add
615 		 * it to the tree
616 		 */
617 		if (xa_is_node(head)) {
618 			xa_to_node(head)->offset = 0;
619 			rcu_assign_pointer(xa_to_node(head)->parent, node);
620 		}
621 		head = xa_mk_node(node);
622 		rcu_assign_pointer(xa->xa_head, head);
623 		xas_update(xas, node);
624 
625 		shift += XA_CHUNK_SHIFT;
626 	}
627 
628 	xas->xa_node = node;
629 	return shift;
630 }
631 
632 /*
633  * xas_create() - Create a slot to store an entry in.
634  * @xas: XArray operation state.
635  * @allow_root: %true if we can store the entry in the root directly
636  *
637  * Most users will not need to call this function directly, as it is called
638  * by xas_store().  It is useful for doing conditional store operations
639  * (see the xa_cmpxchg() implementation for an example).
640  *
641  * Return: If the slot already existed, returns the contents of this slot.
642  * If the slot was newly created, returns %NULL.  If it failed to create the
643  * slot, returns %NULL and indicates the error in @xas.
644  */
645 static void *xas_create(struct xa_state *xas, bool allow_root)
646 {
647 	struct xarray *xa = xas->xa;
648 	void *entry;
649 	void __rcu **slot;
650 	struct xa_node *node = xas->xa_node;
651 	int shift;
652 	unsigned int order = xas->xa_shift;
653 
654 	if (xas_top(node)) {
655 		entry = xa_head_locked(xa);
656 		xas->xa_node = NULL;
657 		if (!entry && xa_zero_busy(xa))
658 			entry = XA_ZERO_ENTRY;
659 		shift = xas_expand(xas, entry);
660 		if (shift < 0)
661 			return NULL;
662 		if (!shift && !allow_root)
663 			shift = XA_CHUNK_SHIFT;
664 		entry = xa_head_locked(xa);
665 		slot = &xa->xa_head;
666 	} else if (xas_error(xas)) {
667 		return NULL;
668 	} else if (node) {
669 		unsigned int offset = xas->xa_offset;
670 
671 		shift = node->shift;
672 		entry = xa_entry_locked(xa, node, offset);
673 		slot = &node->slots[offset];
674 	} else {
675 		shift = 0;
676 		entry = xa_head_locked(xa);
677 		slot = &xa->xa_head;
678 	}
679 
680 	while (shift > order) {
681 		shift -= XA_CHUNK_SHIFT;
682 		if (!entry) {
683 			node = xas_alloc(xas, shift);
684 			if (!node)
685 				break;
686 			if (xa_track_free(xa))
687 				node_mark_all(node, XA_FREE_MARK);
688 			rcu_assign_pointer(*slot, xa_mk_node(node));
689 		} else if (xa_is_node(entry)) {
690 			node = xa_to_node(entry);
691 		} else {
692 			break;
693 		}
694 		entry = xas_descend(xas, node);
695 		slot = &node->slots[xas->xa_offset];
696 	}
697 
698 	return entry;
699 }
700 
701 /**
702  * xas_create_range() - Ensure that stores to this range will succeed
703  * @xas: XArray operation state.
704  *
705  * Creates all of the slots in the range covered by @xas.  Sets @xas to
706  * create single-index entries and positions it at the beginning of the
707  * range.  This is for the benefit of users which have not yet been
708  * converted to use multi-index entries.
709  */
710 void xas_create_range(struct xa_state *xas)
711 {
712 	unsigned long index = xas->xa_index;
713 	unsigned char shift = xas->xa_shift;
714 	unsigned char sibs = xas->xa_sibs;
715 
716 	xas->xa_index |= ((sibs + 1UL) << shift) - 1;
717 	if (xas_is_node(xas) && xas->xa_node->shift == xas->xa_shift)
718 		xas->xa_offset |= sibs;
719 	xas->xa_shift = 0;
720 	xas->xa_sibs = 0;
721 
722 	for (;;) {
723 		xas_create(xas, true);
724 		if (xas_error(xas))
725 			goto restore;
726 		if (xas->xa_index <= (index | XA_CHUNK_MASK))
727 			goto success;
728 		xas->xa_index -= XA_CHUNK_SIZE;
729 
730 		for (;;) {
731 			struct xa_node *node = xas->xa_node;
732 			if (node->shift >= shift)
733 				break;
734 			xas->xa_node = xa_parent_locked(xas->xa, node);
735 			xas->xa_offset = node->offset - 1;
736 			if (node->offset != 0)
737 				break;
738 		}
739 	}
740 
741 restore:
742 	xas->xa_shift = shift;
743 	xas->xa_sibs = sibs;
744 	xas->xa_index = index;
745 	return;
746 success:
747 	xas->xa_index = index;
748 	if (xas->xa_node)
749 		xas_set_offset(xas);
750 }
751 EXPORT_SYMBOL_GPL(xas_create_range);
752 
753 static void update_node(struct xa_state *xas, struct xa_node *node,
754 		int count, int values)
755 {
756 	if (!node || (!count && !values))
757 		return;
758 
759 	node->count += count;
760 	node->nr_values += values;
761 	XA_NODE_BUG_ON(node, node->count > XA_CHUNK_SIZE);
762 	XA_NODE_BUG_ON(node, node->nr_values > XA_CHUNK_SIZE);
763 	xas_update(xas, node);
764 	if (count < 0)
765 		xas_delete_node(xas);
766 }
767 
768 /**
769  * xas_store() - Store this entry in the XArray.
770  * @xas: XArray operation state.
771  * @entry: New entry.
772  *
773  * If @xas is operating on a multi-index entry, the entry returned by this
774  * function is essentially meaningless (it may be an internal entry or it
775  * may be %NULL, even if there are non-NULL entries at some of the indices
776  * covered by the range).  This is not a problem for any current users,
777  * and can be changed if needed.
778  *
779  * Return: The old entry at this index.
780  */
781 void *xas_store(struct xa_state *xas, void *entry)
782 {
783 	struct xa_node *node;
784 	void __rcu **slot = &xas->xa->xa_head;
785 	unsigned int offset, max;
786 	int count = 0;
787 	int values = 0;
788 	void *first, *next;
789 	bool value = xa_is_value(entry);
790 
791 	if (entry) {
792 		bool allow_root = !xa_is_node(entry) && !xa_is_zero(entry);
793 		first = xas_create(xas, allow_root);
794 	} else {
795 		first = xas_load(xas);
796 	}
797 
798 	if (xas_invalid(xas))
799 		return first;
800 	node = xas->xa_node;
801 	if (node && (xas->xa_shift < node->shift))
802 		xas->xa_sibs = 0;
803 	if ((first == entry) && !xas->xa_sibs)
804 		return first;
805 
806 	next = first;
807 	offset = xas->xa_offset;
808 	max = xas->xa_offset + xas->xa_sibs;
809 	if (node) {
810 		slot = &node->slots[offset];
811 		if (xas->xa_sibs)
812 			xas_squash_marks(xas);
813 	}
814 	if (!entry)
815 		xas_init_marks(xas);
816 
817 	for (;;) {
818 		/*
819 		 * Must clear the marks before setting the entry to NULL,
820 		 * otherwise xas_for_each_marked may find a NULL entry and
821 		 * stop early.  rcu_assign_pointer contains a release barrier
822 		 * so the mark clearing will appear to happen before the
823 		 * entry is set to NULL.
824 		 */
825 		rcu_assign_pointer(*slot, entry);
826 		if (xa_is_node(next) && (!node || node->shift))
827 			xas_free_nodes(xas, xa_to_node(next));
828 		if (!node)
829 			break;
830 		count += !next - !entry;
831 		values += !xa_is_value(first) - !value;
832 		if (entry) {
833 			if (offset == max)
834 				break;
835 			if (!xa_is_sibling(entry))
836 				entry = xa_mk_sibling(xas->xa_offset);
837 		} else {
838 			if (offset == XA_CHUNK_MASK)
839 				break;
840 		}
841 		next = xa_entry_locked(xas->xa, node, ++offset);
842 		if (!xa_is_sibling(next)) {
843 			if (!entry && (offset > max))
844 				break;
845 			first = next;
846 		}
847 		slot++;
848 	}
849 
850 	update_node(xas, node, count, values);
851 	return first;
852 }
853 EXPORT_SYMBOL_GPL(xas_store);
854 
855 /**
856  * xas_get_mark() - Returns the state of this mark.
857  * @xas: XArray operation state.
858  * @mark: Mark number.
859  *
860  * Return: true if the mark is set, false if the mark is clear or @xas
861  * is in an error state.
862  */
863 bool xas_get_mark(const struct xa_state *xas, xa_mark_t mark)
864 {
865 	if (xas_invalid(xas))
866 		return false;
867 	if (!xas->xa_node)
868 		return xa_marked(xas->xa, mark);
869 	return node_get_mark(xas->xa_node, xas->xa_offset, mark);
870 }
871 EXPORT_SYMBOL_GPL(xas_get_mark);
872 
873 /**
874  * xas_set_mark() - Sets the mark on this entry and its parents.
875  * @xas: XArray operation state.
876  * @mark: Mark number.
877  *
878  * Sets the specified mark on this entry, and walks up the tree setting it
879  * on all the ancestor entries.  Does nothing if @xas has not been walked to
880  * an entry, or is in an error state.
881  */
882 void xas_set_mark(const struct xa_state *xas, xa_mark_t mark)
883 {
884 	struct xa_node *node = xas->xa_node;
885 	unsigned int offset = xas->xa_offset;
886 
887 	if (xas_invalid(xas))
888 		return;
889 
890 	while (node) {
891 		if (node_set_mark(node, offset, mark))
892 			return;
893 		offset = node->offset;
894 		node = xa_parent_locked(xas->xa, node);
895 	}
896 
897 	if (!xa_marked(xas->xa, mark))
898 		xa_mark_set(xas->xa, mark);
899 }
900 EXPORT_SYMBOL_GPL(xas_set_mark);
901 
902 /**
903  * xas_clear_mark() - Clears the mark on this entry and its parents.
904  * @xas: XArray operation state.
905  * @mark: Mark number.
906  *
907  * Clears the specified mark on this entry, and walks back to the head
908  * attempting to clear it on all the ancestor entries.  Does nothing if
909  * @xas has not been walked to an entry, or is in an error state.
910  */
911 void xas_clear_mark(const struct xa_state *xas, xa_mark_t mark)
912 {
913 	struct xa_node *node = xas->xa_node;
914 	unsigned int offset = xas->xa_offset;
915 
916 	if (xas_invalid(xas))
917 		return;
918 
919 	while (node) {
920 		if (!node_clear_mark(node, offset, mark))
921 			return;
922 		if (node_any_mark(node, mark))
923 			return;
924 
925 		offset = node->offset;
926 		node = xa_parent_locked(xas->xa, node);
927 	}
928 
929 	if (xa_marked(xas->xa, mark))
930 		xa_mark_clear(xas->xa, mark);
931 }
932 EXPORT_SYMBOL_GPL(xas_clear_mark);
933 
934 /**
935  * xas_init_marks() - Initialise all marks for the entry
936  * @xas: Array operations state.
937  *
938  * Initialise all marks for the entry specified by @xas.  If we're tracking
939  * free entries with a mark, we need to set it on all entries.  All other
940  * marks are cleared.
941  *
942  * This implementation is not as efficient as it could be; we may walk
943  * up the tree multiple times.
944  */
945 void xas_init_marks(const struct xa_state *xas)
946 {
947 	xa_mark_t mark = 0;
948 
949 	for (;;) {
950 		if (xa_track_free(xas->xa) && mark == XA_FREE_MARK)
951 			xas_set_mark(xas, mark);
952 		else
953 			xas_clear_mark(xas, mark);
954 		if (mark == XA_MARK_MAX)
955 			break;
956 		mark_inc(mark);
957 	}
958 }
959 EXPORT_SYMBOL_GPL(xas_init_marks);
960 
961 #ifdef CONFIG_XARRAY_MULTI
962 static unsigned int node_get_marks(struct xa_node *node, unsigned int offset)
963 {
964 	unsigned int marks = 0;
965 	xa_mark_t mark = XA_MARK_0;
966 
967 	for (;;) {
968 		if (node_get_mark(node, offset, mark))
969 			marks |= 1 << (__force unsigned int)mark;
970 		if (mark == XA_MARK_MAX)
971 			break;
972 		mark_inc(mark);
973 	}
974 
975 	return marks;
976 }
977 
978 static inline void node_mark_slots(struct xa_node *node, unsigned int sibs,
979 		xa_mark_t mark)
980 {
981 	int i;
982 
983 	if (sibs == 0)
984 		node_mark_all(node, mark);
985 	else {
986 		for (i = 0; i < XA_CHUNK_SIZE; i += sibs + 1)
987 			node_set_mark(node, i, mark);
988 	}
989 }
990 
991 static void node_set_marks(struct xa_node *node, unsigned int offset,
992 			struct xa_node *child, unsigned int sibs,
993 			unsigned int marks)
994 {
995 	xa_mark_t mark = XA_MARK_0;
996 
997 	for (;;) {
998 		if (marks & (1 << (__force unsigned int)mark)) {
999 			node_set_mark(node, offset, mark);
1000 			if (child)
1001 				node_mark_slots(child, sibs, mark);
1002 		}
1003 		if (mark == XA_MARK_MAX)
1004 			break;
1005 		mark_inc(mark);
1006 	}
1007 }
1008 
1009 /**
1010  * xas_split_alloc() - Allocate memory for splitting an entry.
1011  * @xas: XArray operation state.
1012  * @entry: New entry which will be stored in the array.
1013  * @order: Current entry order.
1014  * @gfp: Memory allocation flags.
1015  *
1016  * This function should be called before calling xas_split().
1017  * If necessary, it will allocate new nodes (and fill them with @entry)
1018  * to prepare for the upcoming split of an entry of @order size into
1019  * entries of the order stored in the @xas.
1020  *
1021  * Context: May sleep if @gfp flags permit.
1022  */
1023 void xas_split_alloc(struct xa_state *xas, void *entry, unsigned int order,
1024 		gfp_t gfp)
1025 {
1026 	unsigned int sibs = (1 << (order % XA_CHUNK_SHIFT)) - 1;
1027 	unsigned int mask = xas->xa_sibs;
1028 
1029 	/* XXX: no support for splitting really large entries yet */
1030 	if (WARN_ON(xas->xa_shift + 2 * XA_CHUNK_SHIFT <= order))
1031 		goto nomem;
1032 	if (xas->xa_shift + XA_CHUNK_SHIFT > order)
1033 		return;
1034 
1035 	do {
1036 		unsigned int i;
1037 		void *sibling = NULL;
1038 		struct xa_node *node;
1039 
1040 		node = kmem_cache_alloc_lru(radix_tree_node_cachep, xas->xa_lru, gfp);
1041 		if (!node)
1042 			goto nomem;
1043 		node->array = xas->xa;
1044 		for (i = 0; i < XA_CHUNK_SIZE; i++) {
1045 			if ((i & mask) == 0) {
1046 				RCU_INIT_POINTER(node->slots[i], entry);
1047 				sibling = xa_mk_sibling(i);
1048 			} else {
1049 				RCU_INIT_POINTER(node->slots[i], sibling);
1050 			}
1051 		}
1052 		RCU_INIT_POINTER(node->parent, xas->xa_alloc);
1053 		xas->xa_alloc = node;
1054 	} while (sibs-- > 0);
1055 
1056 	return;
1057 nomem:
1058 	xas_destroy(xas);
1059 	xas_set_err(xas, -ENOMEM);
1060 }
1061 EXPORT_SYMBOL_GPL(xas_split_alloc);
1062 
/**
 * xas_split() - Split a multi-index entry into smaller entries.
 * @xas: XArray operation state.
 * @entry: New entry to store in the array.
 * @order: Current entry order.
 *
 * The size of the new entries is set in @xas.  The value in @entry is
 * copied to all the replacement entries.  Child nodes, where needed, are
 * taken from the @xas->xa_alloc list (linked through their ->parent
 * pointers); no allocation call is made in this function.
 *
 * Context: Any context.  The caller should hold the xa_lock.
 */
void xas_split(struct xa_state *xas, void *entry, unsigned int order)
{
	/* Number of slots, beyond the first, covered at this node's level. */
	unsigned int sibs = (1 << (order % XA_CHUNK_SHIFT)) - 1;
	unsigned int offset, marks;
	struct xa_node *node;
	void *curr = xas_load(xas);
	/* Net change to apply to node->nr_values once all slots are rewritten. */
	int values = 0;

	node = xas->xa_node;
	/* Nothing to split unless the load left @xas positioned in a node. */
	if (xas_top(node))
		return;

	/* Remember the marks of the entry being split so they can be reapplied. */
	marks = node_get_marks(node, xas->xa_offset);

	/* Rewrite the slots from the highest one down to xas->xa_offset. */
	offset = xas->xa_offset + sibs;
	do {
		if (xas->xa_shift < node->shift) {
			/*
			 * The new entries live one level further down: pop a
			 * node from the xa_alloc list, finish initialising it
			 * and install it in this slot.
			 */
			struct xa_node *child = xas->xa_alloc;

			xas->xa_alloc = rcu_dereference_raw(child->parent);
			child->shift = node->shift - XA_CHUNK_SHIFT;
			child->offset = offset;
			child->count = XA_CHUNK_SIZE;
			child->nr_values = xa_is_value(entry) ?
					XA_CHUNK_SIZE : 0;
			RCU_INIT_POINTER(child->parent, node);
			node_set_marks(node, offset, child, xas->xa_sibs,
					marks);
			rcu_assign_pointer(node->slots[offset],
					xa_mk_node(child));
			/* This slot now holds a node pointer instead of a value. */
			if (xa_is_value(curr))
				values--;
			xas_update(xas, child);
		} else {
			/*
			 * The new entries stay in this node: store @entry in
			 * the canonical slot and sibling entries in the
			 * xa_sibs slots above it.  The inner loop leaves
			 * @offset equal to @canon.
			 */
			unsigned int canon = offset - xas->xa_sibs;

			node_set_marks(node, canon, NULL, 0, marks);
			rcu_assign_pointer(node->slots[canon], entry);
			while (offset > canon)
				rcu_assign_pointer(node->slots[offset--],
						xa_mk_sibling(canon));
			values += (xa_is_value(entry) - xa_is_value(curr)) *
					(xas->xa_sibs + 1);
		}
	} while (offset-- > xas->xa_offset);

	node->nr_values += values;
	xas_update(xas, node);
}
EXPORT_SYMBOL_GPL(xas_split);
1124 #endif
1125 
1126 /**
1127  * xas_pause() - Pause a walk to drop a lock.
1128  * @xas: XArray operation state.
1129  *
1130  * Some users need to pause a walk and drop the lock they're holding in
1131  * order to yield to a higher priority thread or carry out an operation
1132  * on an entry.  Those users should call this function before they drop
1133  * the lock.  It resets the @xas to be suitable for the next iteration
1134  * of the loop after the user has reacquired the lock.  If most entries
1135  * found during a walk require you to call xas_pause(), the xa_for_each()
1136  * iterator may be more appropriate.
1137  *
1138  * Note that xas_pause() only works for forward iteration.  If a user needs
1139  * to pause a reverse iteration, we will need a xas_pause_rev().
1140  */
1141 void xas_pause(struct xa_state *xas)
1142 {
1143 	struct xa_node *node = xas->xa_node;
1144 
1145 	if (xas_invalid(xas))
1146 		return;
1147 
1148 	xas->xa_node = XAS_RESTART;
1149 	if (node) {
1150 		unsigned long offset = xas->xa_offset;
1151 		while (++offset < XA_CHUNK_SIZE) {
1152 			if (!xa_is_sibling(xa_entry(xas->xa, node, offset)))
1153 				break;
1154 		}
1155 		xas->xa_index &= ~0UL << node->shift;
1156 		xas->xa_index += (offset - xas->xa_offset) << node->shift;
1157 		if (xas->xa_index == 0)
1158 			xas->xa_node = XAS_BOUNDS;
1159 	} else {
1160 		xas->xa_index++;
1161 	}
1162 }
1163 EXPORT_SYMBOL_GPL(xas_pause);
1164 
1165 /*
1166  * __xas_prev() - Find the previous entry in the XArray.
1167  * @xas: XArray operation state.
1168  *
1169  * Helper function for xas_prev() which handles all the complex cases
1170  * out of line.
1171  */
1172 void *__xas_prev(struct xa_state *xas)
1173 {
1174 	void *entry;
1175 
1176 	if (!xas_frozen(xas->xa_node))
1177 		xas->xa_index--;
1178 	if (!xas->xa_node)
1179 		return set_bounds(xas);
1180 	if (xas_not_node(xas->xa_node))
1181 		return xas_load(xas);
1182 
1183 	if (xas->xa_offset != get_offset(xas->xa_index, xas->xa_node))
1184 		xas->xa_offset--;
1185 
1186 	while (xas->xa_offset == 255) {
1187 		xas->xa_offset = xas->xa_node->offset - 1;
1188 		xas->xa_node = xa_parent(xas->xa, xas->xa_node);
1189 		if (!xas->xa_node)
1190 			return set_bounds(xas);
1191 	}
1192 
1193 	for (;;) {
1194 		entry = xa_entry(xas->xa, xas->xa_node, xas->xa_offset);
1195 		if (!xa_is_node(entry))
1196 			return entry;
1197 
1198 		xas->xa_node = xa_to_node(entry);
1199 		xas_set_offset(xas);
1200 	}
1201 }
1202 EXPORT_SYMBOL_GPL(__xas_prev);
1203 
1204 /*
1205  * __xas_next() - Find the next entry in the XArray.
1206  * @xas: XArray operation state.
1207  *
1208  * Helper function for xas_next() which handles all the complex cases
1209  * out of line.
1210  */
1211 void *__xas_next(struct xa_state *xas)
1212 {
1213 	void *entry;
1214 
1215 	if (!xas_frozen(xas->xa_node))
1216 		xas->xa_index++;
1217 	if (!xas->xa_node)
1218 		return set_bounds(xas);
1219 	if (xas_not_node(xas->xa_node))
1220 		return xas_load(xas);
1221 
1222 	if (xas->xa_offset != get_offset(xas->xa_index, xas->xa_node))
1223 		xas->xa_offset++;
1224 
1225 	while (xas->xa_offset == XA_CHUNK_SIZE) {
1226 		xas->xa_offset = xas->xa_node->offset + 1;
1227 		xas->xa_node = xa_parent(xas->xa, xas->xa_node);
1228 		if (!xas->xa_node)
1229 			return set_bounds(xas);
1230 	}
1231 
1232 	for (;;) {
1233 		entry = xa_entry(xas->xa, xas->xa_node, xas->xa_offset);
1234 		if (!xa_is_node(entry))
1235 			return entry;
1236 
1237 		xas->xa_node = xa_to_node(entry);
1238 		xas_set_offset(xas);
1239 	}
1240 }
1241 EXPORT_SYMBOL_GPL(__xas_next);
1242 
1243 /**
1244  * xas_find() - Find the next present entry in the XArray.
1245  * @xas: XArray operation state.
1246  * @max: Highest index to return.
1247  *
1248  * If the @xas has not yet been walked to an entry, return the entry
1249  * which has an index >= xas.xa_index.  If it has been walked, the entry
1250  * currently being pointed at has been processed, and so we move to the
1251  * next entry.
1252  *
1253  * If no entry is found and the array is smaller than @max, the iterator
1254  * is set to the smallest index not yet in the array.  This allows @xas
1255  * to be immediately passed to xas_store().
1256  *
1257  * Return: The entry, if found, otherwise %NULL.
1258  */
1259 void *xas_find(struct xa_state *xas, unsigned long max)
1260 {
1261 	void *entry;
1262 
1263 	if (xas_error(xas) || xas->xa_node == XAS_BOUNDS)
1264 		return NULL;
1265 	if (xas->xa_index > max)
1266 		return set_bounds(xas);
1267 
1268 	if (!xas->xa_node) {
1269 		xas->xa_index = 1;
1270 		return set_bounds(xas);
1271 	} else if (xas->xa_node == XAS_RESTART) {
1272 		entry = xas_load(xas);
1273 		if (entry || xas_not_node(xas->xa_node))
1274 			return entry;
1275 	} else if (!xas->xa_node->shift &&
1276 		    xas->xa_offset != (xas->xa_index & XA_CHUNK_MASK)) {
1277 		xas->xa_offset = ((xas->xa_index - 1) & XA_CHUNK_MASK) + 1;
1278 	}
1279 
1280 	xas_next_offset(xas);
1281 
1282 	while (xas->xa_node && (xas->xa_index <= max)) {
1283 		if (unlikely(xas->xa_offset == XA_CHUNK_SIZE)) {
1284 			xas->xa_offset = xas->xa_node->offset + 1;
1285 			xas->xa_node = xa_parent(xas->xa, xas->xa_node);
1286 			continue;
1287 		}
1288 
1289 		entry = xa_entry(xas->xa, xas->xa_node, xas->xa_offset);
1290 		if (xa_is_node(entry)) {
1291 			xas->xa_node = xa_to_node(entry);
1292 			xas->xa_offset = 0;
1293 			continue;
1294 		}
1295 		if (entry && !xa_is_sibling(entry))
1296 			return entry;
1297 
1298 		xas_next_offset(xas);
1299 	}
1300 
1301 	if (!xas->xa_node)
1302 		xas->xa_node = XAS_BOUNDS;
1303 	return NULL;
1304 }
1305 EXPORT_SYMBOL_GPL(xas_find);
1306 
/**
 * xas_find_marked() - Find the next marked entry in the XArray.
 * @xas: XArray operation state.
 * @max: Highest index to return.
 * @mark: Mark number to search for.
 *
 * If the @xas has not yet been walked to an entry, return the marked entry
 * which has an index >= xas.xa_index.  If it has been walked, the entry
 * currently being pointed at has been processed, and so we return the
 * first marked entry with an index > xas.xa_index.
 *
 * If no marked entry is found and the array is smaller than @max, @xas is
 * set to the bounds state and xas->xa_index is set to the smallest index
 * not yet in the array.  This allows @xas to be immediately passed to
 * xas_store().
 *
 * If no entry is found before @max is reached, @xas is set to the restart
 * state.
 *
 * Return: The entry, if found, otherwise %NULL.
 */
void *xas_find_marked(struct xa_state *xas, unsigned long max, xa_mark_t mark)
{
	/*
	 * Passed to xas_find_chunk(): true while the current slot has already
	 * been processed, false once @xas has been moved to a slot that still
	 * has to be examined.
	 */
	bool advance = true;
	unsigned int offset;
	void *entry;

	if (xas_error(xas))
		return NULL;
	if (xas->xa_index > max)
		goto max;

	if (!xas->xa_node) {
		/* No node to continue in: carry on from index 1 via 'out'. */
		xas->xa_index = 1;
		goto out;
	} else if (xas_top(xas->xa_node)) {
		/* Not walked yet: start from the head of the array. */
		advance = false;
		entry = xa_head(xas->xa);
		xas->xa_node = NULL;
		if (xas->xa_index > max_index(entry))
			goto out;
		if (!xa_is_node(entry)) {
			/* The head is a plain entry; its mark is kept on the array. */
			if (xa_marked(xas->xa, mark))
				return entry;
			xas->xa_index = 1;
			goto out;
		}
		xas->xa_node = xa_to_node(entry);
		xas->xa_offset = xas->xa_index >> xas->xa_node->shift;
	}

	while (xas->xa_index <= max) {
		if (unlikely(xas->xa_offset == XA_CHUNK_SIZE)) {
			/* End of this node: continue with the next slot of the parent. */
			xas->xa_offset = xas->xa_node->offset + 1;
			xas->xa_node = xa_parent(xas->xa, xas->xa_node);
			if (!xas->xa_node)
				break;
			advance = false;
			continue;
		}

		if (!advance) {
			/* Landed on a sibling slot: move back to the slot it refers to. */
			entry = xa_entry(xas->xa, xas->xa_node, xas->xa_offset);
			if (xa_is_sibling(entry)) {
				xas->xa_offset = xa_to_sibling(entry);
				xas_move_index(xas, xas->xa_offset);
			}
		}

		offset = xas_find_chunk(xas, advance, mark);
		if (offset > xas->xa_offset) {
			advance = false;
			xas_move_index(xas, offset);
			/* Mind the wrap */
			if ((xas->xa_index - 1) >= max)
				goto max;
			xas->xa_offset = offset;
			/* No marked slot left in this node; let the loop climb. */
			if (offset == XA_CHUNK_SIZE)
				continue;
		}

		entry = xa_entry(xas->xa, xas->xa_node, xas->xa_offset);
		/* An empty slot only counts when searching for free slots. */
		if (!entry && !(xa_track_free(xas->xa) && mark == XA_FREE_MARK))
			continue;
		if (xa_is_sibling(entry))
			continue;
		if (!xa_is_node(entry))
			return entry;
		/* Marked slot holds a node: descend and search inside it. */
		xas->xa_node = xa_to_node(entry);
		xas_set_offset(xas);
	}

out:
	/* Past @max means restart state; otherwise report the bounds state. */
	if (xas->xa_index > max)
		goto max;
	return set_bounds(xas);
max:
	xas->xa_node = XAS_RESTART;
	return NULL;
}
EXPORT_SYMBOL_GPL(xas_find_marked);
1408 
/**
 * xas_find_conflict() - Find the next present entry in a range.
 * @xas: XArray operation state.
 *
 * The @xas describes both a range and a position within that range.
 * Each call resumes from the position left by the previous one.
 *
 * Context: Any context.  Expects xa_lock to be held.
 * Return: The next entry in the range covered by @xas or %NULL.
 */
void *xas_find_conflict(struct xa_state *xas)
{
	void *curr;

	if (xas_error(xas))
		return NULL;

	if (!xas->xa_node)
		return NULL;

	if (xas_top(xas->xa_node)) {
		/* First call: walk down from the head as far as the tree goes. */
		curr = xas_start(xas);
		if (!curr)
			return NULL;
		while (xa_is_node(curr)) {
			struct xa_node *node = xa_to_node(curr);
			curr = xas_descend(xas, node);
		}
		if (curr)
			return curr;
	}

	/* The walk stopped in a node above the level of the range. */
	if (xas->xa_node->shift > xas->xa_shift)
		return NULL;

	for (;;) {
		if (xas->xa_node->shift == xas->xa_shift) {
			/* At the range's own level: stop after its last slot. */
			if ((xas->xa_offset & xas->xa_sibs) == xas->xa_sibs)
				break;
		} else if (xas->xa_offset == XA_CHUNK_MASK) {
			/* Last slot of a lower node: go back up to its parent slot. */
			xas->xa_offset = xas->xa_node->offset;
			xas->xa_node = xa_parent_locked(xas->xa, xas->xa_node);
			if (!xas->xa_node)
				break;
			continue;
		}
		/* Step to the next slot, skipping sibling entries. */
		curr = xa_entry_locked(xas->xa, xas->xa_node, ++xas->xa_offset);
		if (xa_is_sibling(curr))
			continue;
		/* Follow node pointers down to the first slot of each child. */
		while (xa_is_node(curr)) {
			xas->xa_node = xa_to_node(curr);
			xas->xa_offset = 0;
			curr = xa_entry_locked(xas->xa, xas->xa_node, 0);
		}
		if (curr)
			return curr;
	}
	/*
	 * Move the offset back by xa_sibs; when the loop ended on the last
	 * slot of the range this is the range's first slot.
	 */
	xas->xa_offset -= xas->xa_sibs;
	return NULL;
}
EXPORT_SYMBOL_GPL(xas_find_conflict);
1469 
1470 /**
1471  * xa_load() - Load an entry from an XArray.
1472  * @xa: XArray.
1473  * @index: index into array.
1474  *
1475  * Context: Any context.  Takes and releases the RCU lock.
1476  * Return: The entry at @index in @xa.
1477  */
1478 void *xa_load(struct xarray *xa, unsigned long index)
1479 {
1480 	XA_STATE(xas, xa, index);
1481 	void *entry;
1482 
1483 	rcu_read_lock();
1484 	do {
1485 		entry = xa_zero_to_null(xas_load(&xas));
1486 	} while (xas_retry(&xas, entry));
1487 	rcu_read_unlock();
1488 
1489 	return entry;
1490 }
1491 EXPORT_SYMBOL(xa_load);
1492 
1493 static void *xas_result(struct xa_state *xas, void *curr)
1494 {
1495 	if (xas_error(xas))
1496 		curr = xas->xa_node;
1497 	return curr;
1498 }
1499 
1500 /**
1501  * __xa_erase() - Erase this entry from the XArray while locked.
1502  * @xa: XArray.
1503  * @index: Index into array.
1504  *
1505  * After this function returns, loading from @index will return %NULL.
1506  * If the index is part of a multi-index entry, all indices will be erased
1507  * and none of the entries will be part of a multi-index entry.
1508  *
1509  * Context: Any context.  Expects xa_lock to be held on entry.
1510  * Return: The entry which used to be at this index.
1511  */
1512 void *__xa_erase(struct xarray *xa, unsigned long index)
1513 {
1514 	XA_STATE(xas, xa, index);
1515 	return xas_result(&xas, xa_zero_to_null(xas_store(&xas, NULL)));
1516 }
1517 EXPORT_SYMBOL(__xa_erase);
1518 
/**
 * xa_erase() - Erase this entry from the XArray.
 * @xa: XArray.
 * @index: Index of entry.
 *
 * Locked wrapper around __xa_erase().  After this function returns,
 * loading from @index will return %NULL.  If the index is part of a
 * multi-index entry, all indices will be erased and none of the entries
 * will be part of a multi-index entry.
 *
 * Context: Any context.  Takes and releases the xa_lock.
 * Return: The entry which used to be at this index.
 */
void *xa_erase(struct xarray *xa, unsigned long index)
{
	void *old;

	xa_lock(xa);
	old = __xa_erase(xa, index);
	xa_unlock(xa);

	return old;
}
EXPORT_SYMBOL(xa_erase);
1542 
1543 /**
1544  * __xa_store() - Store this entry in the XArray.
1545  * @xa: XArray.
1546  * @index: Index into array.
1547  * @entry: New entry.
1548  * @gfp: Memory allocation flags.
1549  *
1550  * You must already be holding the xa_lock when calling this function.
1551  * It will drop the lock if needed to allocate memory, and then reacquire
1552  * it afterwards.
1553  *
1554  * Context: Any context.  Expects xa_lock to be held on entry.  May
1555  * release and reacquire xa_lock if @gfp flags permit.
1556  * Return: The old entry at this index or xa_err() if an error happened.
1557  */
1558 void *__xa_store(struct xarray *xa, unsigned long index, void *entry, gfp_t gfp)
1559 {
1560 	XA_STATE(xas, xa, index);
1561 	void *curr;
1562 
1563 	if (WARN_ON_ONCE(xa_is_advanced(entry)))
1564 		return XA_ERROR(-EINVAL);
1565 	if (xa_track_free(xa) && !entry)
1566 		entry = XA_ZERO_ENTRY;
1567 
1568 	do {
1569 		curr = xas_store(&xas, entry);
1570 		if (xa_track_free(xa))
1571 			xas_clear_mark(&xas, XA_FREE_MARK);
1572 	} while (__xas_nomem(&xas, gfp));
1573 
1574 	return xas_result(&xas, xa_zero_to_null(curr));
1575 }
1576 EXPORT_SYMBOL(__xa_store);
1577 
1578 /**
1579  * xa_store() - Store this entry in the XArray.
1580  * @xa: XArray.
1581  * @index: Index into array.
1582  * @entry: New entry.
1583  * @gfp: Memory allocation flags.
1584  *
1585  * After this function returns, loads from this index will return @entry.
1586  * Storing into an existing multi-index entry updates the entry of every index.
1587  * The marks associated with @index are unaffected unless @entry is %NULL.
1588  *
1589  * Context: Any context.  Takes and releases the xa_lock.
1590  * May sleep if the @gfp flags permit.
1591  * Return: The old entry at this index on success, xa_err(-EINVAL) if @entry
1592  * cannot be stored in an XArray, or xa_err(-ENOMEM) if memory allocation
1593  * failed.
1594  */
1595 void *xa_store(struct xarray *xa, unsigned long index, void *entry, gfp_t gfp)
1596 {
1597 	void *curr;
1598 
1599 	xa_lock(xa);
1600 	curr = __xa_store(xa, index, entry, gfp);
1601 	xa_unlock(xa);
1602 
1603 	return curr;
1604 }
1605 EXPORT_SYMBOL(xa_store);
1606 
1607 static inline void *__xa_cmpxchg_raw(struct xarray *xa, unsigned long index,
1608 			void *old, void *entry, gfp_t gfp);
1609 
1610 /**
1611  * __xa_cmpxchg() - Store this entry in the XArray.
1612  * @xa: XArray.
1613  * @index: Index into array.
1614  * @old: Old value to test against.
1615  * @entry: New entry.
1616  * @gfp: Memory allocation flags.
1617  *
1618  * You must already be holding the xa_lock when calling this function.
1619  * It will drop the lock if needed to allocate memory, and then reacquire
1620  * it afterwards.
1621  *
1622  * Context: Any context.  Expects xa_lock to be held on entry.  May
1623  * release and reacquire xa_lock if @gfp flags permit.
1624  * Return: The old entry at this index or xa_err() if an error happened.
1625  */
1626 void *__xa_cmpxchg(struct xarray *xa, unsigned long index,
1627 			void *old, void *entry, gfp_t gfp)
1628 {
1629 	return xa_zero_to_null(__xa_cmpxchg_raw(xa, index, old, entry, gfp));
1630 }
1631 EXPORT_SYMBOL(__xa_cmpxchg);
1632 
1633 static inline void *__xa_cmpxchg_raw(struct xarray *xa, unsigned long index,
1634 			void *old, void *entry, gfp_t gfp)
1635 {
1636 	XA_STATE(xas, xa, index);
1637 	void *curr;
1638 
1639 	if (WARN_ON_ONCE(xa_is_advanced(entry)))
1640 		return XA_ERROR(-EINVAL);
1641 
1642 	do {
1643 		curr = xas_load(&xas);
1644 		if (curr == old) {
1645 			xas_store(&xas, entry);
1646 			if (xa_track_free(xa) && entry && !curr)
1647 				xas_clear_mark(&xas, XA_FREE_MARK);
1648 		}
1649 	} while (__xas_nomem(&xas, gfp));
1650 
1651 	return xas_result(&xas, curr);
1652 }
1653 
1654 /**
1655  * __xa_insert() - Store this entry in the XArray if no entry is present.
1656  * @xa: XArray.
1657  * @index: Index into array.
1658  * @entry: New entry.
1659  * @gfp: Memory allocation flags.
1660  *
1661  * Inserting a NULL entry will store a reserved entry (like xa_reserve())
1662  * if no entry is present.  Inserting will fail if a reserved entry is
1663  * present, even though loading from this index will return NULL.
1664  *
1665  * Context: Any context.  Expects xa_lock to be held on entry.  May
1666  * release and reacquire xa_lock if @gfp flags permit.
1667  * Return: 0 if the store succeeded.  -EBUSY if another entry was present.
1668  * -ENOMEM if memory could not be allocated.
1669  */
1670 int __xa_insert(struct xarray *xa, unsigned long index, void *entry, gfp_t gfp)
1671 {
1672 	void *curr;
1673 	int errno;
1674 
1675 	if (!entry)
1676 		entry = XA_ZERO_ENTRY;
1677 	curr = __xa_cmpxchg_raw(xa, index, NULL, entry, gfp);
1678 	errno = xa_err(curr);
1679 	if (errno)
1680 		return errno;
1681 	return (curr != NULL) ? -EBUSY : 0;
1682 }
1683 EXPORT_SYMBOL(__xa_insert);
1684 
1685 #ifdef CONFIG_XARRAY_MULTI
1686 static void xas_set_range(struct xa_state *xas, unsigned long first,
1687 		unsigned long last)
1688 {
1689 	unsigned int shift = 0;
1690 	unsigned long sibs = last - first;
1691 	unsigned int offset = XA_CHUNK_MASK;
1692 
1693 	xas_set(xas, first);
1694 
1695 	while ((first & XA_CHUNK_MASK) == 0) {
1696 		if (sibs < XA_CHUNK_MASK)
1697 			break;
1698 		if ((sibs == XA_CHUNK_MASK) && (offset < XA_CHUNK_MASK))
1699 			break;
1700 		shift += XA_CHUNK_SHIFT;
1701 		if (offset == XA_CHUNK_MASK)
1702 			offset = sibs & XA_CHUNK_MASK;
1703 		sibs >>= XA_CHUNK_SHIFT;
1704 		first >>= XA_CHUNK_SHIFT;
1705 	}
1706 
1707 	offset = first & XA_CHUNK_MASK;
1708 	if (offset + sibs > XA_CHUNK_MASK)
1709 		sibs = XA_CHUNK_MASK - offset;
1710 	if ((((first + sibs + 1) << shift) - 1) > last)
1711 		sibs -= 1;
1712 
1713 	xas->xa_shift = shift;
1714 	xas->xa_sibs = sibs;
1715 }
1716 
/**
 * xa_store_range() - Store this entry at a range of indices in the XArray.
 * @xa: XArray.
 * @first: First index to affect.
 * @last: Last index to affect.
 * @entry: New entry.
 * @gfp: Memory allocation flags.
 *
 * After this function returns, loads from any index between @first and @last,
 * inclusive will return @entry.
 * Storing into an existing multi-index entry updates the entry of every index.
 * The marks associated with the affected indices are unaffected unless
 * @entry is %NULL.
 *
 * Context: Process context.  Takes and releases the xa_lock.  May sleep
 * if the @gfp flags permit.
 * Return: %NULL on success, xa_err(-EINVAL) if @entry cannot be stored in
 * an XArray or if @last is below @first, or xa_err(-ENOMEM) if memory
 * allocation failed.
 */
void *xa_store_range(struct xarray *xa, unsigned long first,
		unsigned long last, void *entry, gfp_t gfp)
{
	XA_STATE(xas, xa, 0);

	if (WARN_ON_ONCE(xa_is_internal(entry)))
		return XA_ERROR(-EINVAL);
	if (last < first)
		return XA_ERROR(-EINVAL);

	/* Each pass runs under the lock; xas_nomem() decides whether to retry. */
	do {
		xas_lock(&xas);
		if (entry) {
			/*
			 * Create the slot for @last before storing anything.
			 * The order is the index of the lowest set bit of
			 * last + 1, or BITS_PER_LONG when last + 1 wraps to 0.
			 */
			unsigned int order = BITS_PER_LONG;
			if (last + 1)
				order = __ffs(last + 1);
			xas_set_order(&xas, last, order);
			xas_create(&xas, true);
			if (xas_error(&xas))
				goto unlock;
		}
		/*
		 * Store the range piece by piece, advancing @first by
		 * xas_size() after each store.  @first is not reset between
		 * passes of the outer loop, so a retry resumes where the
		 * previous pass stopped.
		 */
		do {
			xas_set_range(&xas, first, last);
			xas_store(&xas, entry);
			if (xas_error(&xas))
				goto unlock;
			first += xas_size(&xas);
		} while (first <= last);
unlock:
		xas_unlock(&xas);
	} while (xas_nomem(&xas, gfp));

	return xas_result(&xas, NULL);
}
EXPORT_SYMBOL(xa_store_range);
1770 
1771 /**
1772  * xas_get_order() - Get the order of an entry.
1773  * @xas: XArray operation state.
1774  *
1775  * Called after xas_load, the xas should not be in an error state.
1776  *
1777  * Return: A number between 0 and 63 indicating the order of the entry.
1778  */
1779 int xas_get_order(struct xa_state *xas)
1780 {
1781 	int order = 0;
1782 
1783 	if (!xas->xa_node)
1784 		return 0;
1785 
1786 	for (;;) {
1787 		unsigned int slot = xas->xa_offset + (1 << order);
1788 
1789 		if (slot >= XA_CHUNK_SIZE)
1790 			break;
1791 		if (!xa_is_sibling(xa_entry(xas->xa, xas->xa_node, slot)))
1792 			break;
1793 		order++;
1794 	}
1795 
1796 	order += xas->xa_node->shift;
1797 	return order;
1798 }
1799 EXPORT_SYMBOL_GPL(xas_get_order);
1800 
1801 /**
1802  * xa_get_order() - Get the order of an entry.
1803  * @xa: XArray.
1804  * @index: Index of the entry.
1805  *
1806  * Return: A number between 0 and 63 indicating the order of the entry.
1807  */
1808 int xa_get_order(struct xarray *xa, unsigned long index)
1809 {
1810 	XA_STATE(xas, xa, index);
1811 	int order = 0;
1812 	void *entry;
1813 
1814 	rcu_read_lock();
1815 	entry = xas_load(&xas);
1816 	if (entry)
1817 		order = xas_get_order(&xas);
1818 	rcu_read_unlock();
1819 
1820 	return order;
1821 }
1822 EXPORT_SYMBOL(xa_get_order);
1823 #endif /* CONFIG_XARRAY_MULTI */
1824 
1825 /**
1826  * __xa_alloc() - Find somewhere to store this entry in the XArray.
1827  * @xa: XArray.
1828  * @id: Pointer to ID.
1829  * @limit: Range for allocated ID.
1830  * @entry: New entry.
1831  * @gfp: Memory allocation flags.
1832  *
1833  * Finds an empty entry in @xa between @limit.min and @limit.max,
1834  * stores the index into the @id pointer, then stores the entry at
1835  * that index.  A concurrent lookup will not see an uninitialised @id.
1836  *
1837  * Must only be operated on an xarray initialized with flag XA_FLAGS_ALLOC set
1838  * in xa_init_flags().
1839  *
1840  * Context: Any context.  Expects xa_lock to be held on entry.  May
1841  * release and reacquire xa_lock if @gfp flags permit.
1842  * Return: 0 on success, -ENOMEM if memory could not be allocated or
1843  * -EBUSY if there are no free entries in @limit.
1844  */
1845 int __xa_alloc(struct xarray *xa, u32 *id, void *entry,
1846 		struct xa_limit limit, gfp_t gfp)
1847 {
1848 	XA_STATE(xas, xa, 0);
1849 
1850 	if (WARN_ON_ONCE(xa_is_advanced(entry)))
1851 		return -EINVAL;
1852 	if (WARN_ON_ONCE(!xa_track_free(xa)))
1853 		return -EINVAL;
1854 
1855 	if (!entry)
1856 		entry = XA_ZERO_ENTRY;
1857 
1858 	do {
1859 		xas.xa_index = limit.min;
1860 		xas_find_marked(&xas, limit.max, XA_FREE_MARK);
1861 		if (xas.xa_node == XAS_RESTART)
1862 			xas_set_err(&xas, -EBUSY);
1863 		else
1864 			*id = xas.xa_index;
1865 		xas_store(&xas, entry);
1866 		xas_clear_mark(&xas, XA_FREE_MARK);
1867 	} while (__xas_nomem(&xas, gfp));
1868 
1869 	return xas_error(&xas);
1870 }
1871 EXPORT_SYMBOL(__xa_alloc);
1872 
1873 /**
1874  * __xa_alloc_cyclic() - Find somewhere to store this entry in the XArray.
1875  * @xa: XArray.
1876  * @id: Pointer to ID.
1877  * @entry: New entry.
1878  * @limit: Range of allocated ID.
1879  * @next: Pointer to next ID to allocate.
1880  * @gfp: Memory allocation flags.
1881  *
1882  * Finds an empty entry in @xa between @limit.min and @limit.max,
1883  * stores the index into the @id pointer, then stores the entry at
1884  * that index.  A concurrent lookup will not see an uninitialised @id.
1885  * The search for an empty entry will start at @next and will wrap
1886  * around if necessary.
1887  *
1888  * Must only be operated on an xarray initialized with flag XA_FLAGS_ALLOC set
1889  * in xa_init_flags().
1890  *
1891  * Context: Any context.  Expects xa_lock to be held on entry.  May
1892  * release and reacquire xa_lock if @gfp flags permit.
1893  * Return: 0 if the allocation succeeded without wrapping.  1 if the
1894  * allocation succeeded after wrapping, -ENOMEM if memory could not be
1895  * allocated or -EBUSY if there are no free entries in @limit.
1896  */
1897 int __xa_alloc_cyclic(struct xarray *xa, u32 *id, void *entry,
1898 		struct xa_limit limit, u32 *next, gfp_t gfp)
1899 {
1900 	u32 min = limit.min;
1901 	int ret;
1902 
1903 	limit.min = max(min, *next);
1904 	ret = __xa_alloc(xa, id, entry, limit, gfp);
1905 	if ((xa->xa_flags & XA_FLAGS_ALLOC_WRAPPED) && ret == 0) {
1906 		xa->xa_flags &= ~XA_FLAGS_ALLOC_WRAPPED;
1907 		ret = 1;
1908 	}
1909 
1910 	if (ret < 0 && limit.min > min) {
1911 		limit.min = min;
1912 		ret = __xa_alloc(xa, id, entry, limit, gfp);
1913 		if (ret == 0)
1914 			ret = 1;
1915 	}
1916 
1917 	if (ret >= 0) {
1918 		*next = *id + 1;
1919 		if (*next == 0)
1920 			xa->xa_flags |= XA_FLAGS_ALLOC_WRAPPED;
1921 	}
1922 	return ret;
1923 }
1924 EXPORT_SYMBOL(__xa_alloc_cyclic);
1925 
1926 /**
1927  * __xa_set_mark() - Set this mark on this entry while locked.
1928  * @xa: XArray.
1929  * @index: Index of entry.
1930  * @mark: Mark number.
1931  *
1932  * Attempting to set a mark on a %NULL entry does not succeed.
1933  *
1934  * Context: Any context.  Expects xa_lock to be held on entry.
1935  */
1936 void __xa_set_mark(struct xarray *xa, unsigned long index, xa_mark_t mark)
1937 {
1938 	XA_STATE(xas, xa, index);
1939 	void *entry = xas_load(&xas);
1940 
1941 	if (entry)
1942 		xas_set_mark(&xas, mark);
1943 }
1944 EXPORT_SYMBOL(__xa_set_mark);
1945 
1946 /**
1947  * __xa_clear_mark() - Clear this mark on this entry while locked.
1948  * @xa: XArray.
1949  * @index: Index of entry.
1950  * @mark: Mark number.
1951  *
1952  * Context: Any context.  Expects xa_lock to be held on entry.
1953  */
1954 void __xa_clear_mark(struct xarray *xa, unsigned long index, xa_mark_t mark)
1955 {
1956 	XA_STATE(xas, xa, index);
1957 	void *entry = xas_load(&xas);
1958 
1959 	if (entry)
1960 		xas_clear_mark(&xas, mark);
1961 }
1962 EXPORT_SYMBOL(__xa_clear_mark);
1963 
1964 /**
1965  * xa_get_mark() - Inquire whether this mark is set on this entry.
1966  * @xa: XArray.
1967  * @index: Index of entry.
1968  * @mark: Mark number.
1969  *
1970  * This function uses the RCU read lock, so the result may be out of date
1971  * by the time it returns.  If you need the result to be stable, use a lock.
1972  *
1973  * Context: Any context.  Takes and releases the RCU lock.
1974  * Return: True if the entry at @index has this mark set, false if it doesn't.
1975  */
1976 bool xa_get_mark(struct xarray *xa, unsigned long index, xa_mark_t mark)
1977 {
1978 	XA_STATE(xas, xa, index);
1979 	void *entry;
1980 
1981 	rcu_read_lock();
1982 	entry = xas_start(&xas);
1983 	while (xas_get_mark(&xas, mark)) {
1984 		if (!xa_is_node(entry))
1985 			goto found;
1986 		entry = xas_descend(&xas, xa_to_node(entry));
1987 	}
1988 	rcu_read_unlock();
1989 	return false;
1990  found:
1991 	rcu_read_unlock();
1992 	return true;
1993 }
1994 EXPORT_SYMBOL(xa_get_mark);
1995 
/**
 * xa_set_mark() - Set this mark on this entry.
 * @xa: XArray.
 * @index: Index of entry.
 * @mark: Mark number.
 *
 * Locked wrapper around __xa_set_mark().
 * Attempting to set a mark on a %NULL entry does not succeed.
 *
 * Context: Process context.  Takes and releases the xa_lock.
 */
void xa_set_mark(struct xarray *xa, unsigned long index, xa_mark_t mark)
{
	xa_lock(xa);
	__xa_set_mark(xa, index, mark);
	xa_unlock(xa);
}
EXPORT_SYMBOL(xa_set_mark);
2013 
/**
 * xa_clear_mark() - Clear this mark on this entry.
 * @xa: XArray.
 * @index: Index of entry.
 * @mark: Mark number.
 *
 * Locked wrapper around __xa_clear_mark().
 * Clearing a mark always succeeds.
 *
 * Context: Process context.  Takes and releases the xa_lock.
 */
void xa_clear_mark(struct xarray *xa, unsigned long index, xa_mark_t mark)
{
	xa_lock(xa);
	__xa_clear_mark(xa, index, mark);
	xa_unlock(xa);
}
EXPORT_SYMBOL(xa_clear_mark);
2031 
2032 /**
2033  * xa_find() - Search the XArray for an entry.
2034  * @xa: XArray.
2035  * @indexp: Pointer to an index.
2036  * @max: Maximum index to search to.
2037  * @filter: Selection criterion.
2038  *
2039  * Finds the entry in @xa which matches the @filter, and has the lowest
2040  * index that is at least @indexp and no more than @max.
2041  * If an entry is found, @indexp is updated to be the index of the entry.
2042  * This function is protected by the RCU read lock, so it may not find
2043  * entries which are being simultaneously added.  It will not return an
2044  * %XA_RETRY_ENTRY; if you need to see retry entries, use xas_find().
2045  *
2046  * Context: Any context.  Takes and releases the RCU lock.
2047  * Return: The entry, if found, otherwise %NULL.
2048  */
2049 void *xa_find(struct xarray *xa, unsigned long *indexp,
2050 			unsigned long max, xa_mark_t filter)
2051 {
2052 	XA_STATE(xas, xa, *indexp);
2053 	void *entry;
2054 
2055 	rcu_read_lock();
2056 	do {
2057 		if ((__force unsigned int)filter < XA_MAX_MARKS)
2058 			entry = xas_find_marked(&xas, max, filter);
2059 		else
2060 			entry = xas_find(&xas, max);
2061 	} while (xas_retry(&xas, entry));
2062 	rcu_read_unlock();
2063 
2064 	if (entry)
2065 		*indexp = xas.xa_index;
2066 	return entry;
2067 }
2068 EXPORT_SYMBOL(xa_find);
2069 
2070 static bool xas_sibling(struct xa_state *xas)
2071 {
2072 	struct xa_node *node = xas->xa_node;
2073 	unsigned long mask;
2074 
2075 	if (!IS_ENABLED(CONFIG_XARRAY_MULTI) || !node)
2076 		return false;
2077 	mask = (XA_CHUNK_SIZE << node->shift) - 1;
2078 	return (xas->xa_index & mask) >
2079 		((unsigned long)xas->xa_offset << node->shift);
2080 }
2081 
2082 /**
2083  * xa_find_after() - Search the XArray for a present entry.
2084  * @xa: XArray.
2085  * @indexp: Pointer to an index.
2086  * @max: Maximum index to search to.
2087  * @filter: Selection criterion.
2088  *
2089  * Finds the entry in @xa which matches the @filter and has the lowest
2090  * index that is above @indexp and no more than @max.
2091  * If an entry is found, @indexp is updated to be the index of the entry.
2092  * This function is protected by the RCU read lock, so it may miss entries
2093  * which are being simultaneously added.  It will not return an
2094  * %XA_RETRY_ENTRY; if you need to see retry entries, use xas_find().
2095  *
2096  * Context: Any context.  Takes and releases the RCU lock.
2097  * Return: The pointer, if found, otherwise %NULL.
2098  */
2099 void *xa_find_after(struct xarray *xa, unsigned long *indexp,
2100 			unsigned long max, xa_mark_t filter)
2101 {
2102 	XA_STATE(xas, xa, *indexp + 1);
2103 	void *entry;
2104 
2105 	if (xas.xa_index == 0)
2106 		return NULL;
2107 
2108 	rcu_read_lock();
2109 	for (;;) {
2110 		if ((__force unsigned int)filter < XA_MAX_MARKS)
2111 			entry = xas_find_marked(&xas, max, filter);
2112 		else
2113 			entry = xas_find(&xas, max);
2114 
2115 		if (xas_invalid(&xas))
2116 			break;
2117 		if (xas_sibling(&xas))
2118 			continue;
2119 		if (!xas_retry(&xas, entry))
2120 			break;
2121 	}
2122 	rcu_read_unlock();
2123 
2124 	if (entry)
2125 		*indexp = xas.xa_index;
2126 	return entry;
2127 }
2128 EXPORT_SYMBOL(xa_find_after);
2129 
2130 static unsigned int xas_extract_present(struct xa_state *xas, void **dst,
2131 			unsigned long max, unsigned int n)
2132 {
2133 	void *entry;
2134 	unsigned int i = 0;
2135 
2136 	rcu_read_lock();
2137 	xas_for_each(xas, entry, max) {
2138 		if (xas_retry(xas, entry))
2139 			continue;
2140 		dst[i++] = entry;
2141 		if (i == n)
2142 			break;
2143 	}
2144 	rcu_read_unlock();
2145 
2146 	return i;
2147 }
2148 
2149 static unsigned int xas_extract_marked(struct xa_state *xas, void **dst,
2150 			unsigned long max, unsigned int n, xa_mark_t mark)
2151 {
2152 	void *entry;
2153 	unsigned int i = 0;
2154 
2155 	rcu_read_lock();
2156 	xas_for_each_marked(xas, entry, max, mark) {
2157 		if (xas_retry(xas, entry))
2158 			continue;
2159 		dst[i++] = entry;
2160 		if (i == n)
2161 			break;
2162 	}
2163 	rcu_read_unlock();
2164 
2165 	return i;
2166 }
2167 
2168 /**
2169  * xa_extract() - Copy selected entries from the XArray into a normal array.
2170  * @xa: The source XArray to copy from.
2171  * @dst: The buffer to copy entries into.
2172  * @start: The first index in the XArray eligible to be selected.
2173  * @max: The last index in the XArray eligible to be selected.
2174  * @n: The maximum number of entries to copy.
2175  * @filter: Selection criterion.
2176  *
2177  * Copies up to @n entries that match @filter from the XArray.  The
2178  * copied entries will have indices between @start and @max, inclusive.
2179  *
2180  * The @filter may be an XArray mark value, in which case entries which are
2181  * marked with that mark will be copied.  It may also be %XA_PRESENT, in
2182  * which case all entries which are not %NULL will be copied.
2183  *
2184  * The entries returned may not represent a snapshot of the XArray at a
2185  * moment in time.  For example, if another thread stores to index 5, then
2186  * index 10, calling xa_extract() may return the old contents of index 5
2187  * and the new contents of index 10.  Indices not modified while this
2188  * function is running will not be skipped.
2189  *
2190  * If you need stronger guarantees, holding the xa_lock across calls to this
2191  * function will prevent concurrent modification.
2192  *
2193  * Context: Any context.  Takes and releases the RCU lock.
2194  * Return: The number of entries copied.
2195  */
2196 unsigned int xa_extract(struct xarray *xa, void **dst, unsigned long start,
2197 			unsigned long max, unsigned int n, xa_mark_t filter)
2198 {
2199 	XA_STATE(xas, xa, start);
2200 
2201 	if (!n)
2202 		return 0;
2203 
2204 	if ((__force unsigned int)filter < XA_MAX_MARKS)
2205 		return xas_extract_marked(&xas, dst, max, n, filter);
2206 	return xas_extract_present(&xas, dst, max, n);
2207 }
2208 EXPORT_SYMBOL(xa_extract);
2209 
2210 /**
2211  * xa_delete_node() - Private interface for workingset code.
2212  * @node: Node to be removed from the tree.
2213  * @update: Function to call to update ancestor nodes.
2214  *
2215  * Context: xa_lock must be held on entry and will not be released.
2216  */
2217 void xa_delete_node(struct xa_node *node, xa_update_node_t update)
2218 {
2219 	struct xa_state xas = {
2220 		.xa = node->array,
2221 		.xa_index = (unsigned long)node->offset <<
2222 				(node->shift + XA_CHUNK_SHIFT),
2223 		.xa_shift = node->shift + XA_CHUNK_SHIFT,
2224 		.xa_offset = node->offset,
2225 		.xa_node = xa_parent_locked(node->array, node),
2226 		.xa_update = update,
2227 	};
2228 
2229 	xas_store(&xas, NULL);
2230 }
2231 EXPORT_SYMBOL_GPL(xa_delete_node);	/* For the benefit of the test suite */
2232 
2233 /**
2234  * xa_destroy() - Free all internal data structures.
2235  * @xa: XArray.
2236  *
2237  * After calling this function, the XArray is empty and has freed all memory
2238  * allocated for its internal data structures.  You are responsible for
2239  * freeing the objects referenced by the XArray.
2240  *
2241  * Context: Any context.  Takes and releases the xa_lock, interrupt-safe.
2242  */
2243 void xa_destroy(struct xarray *xa)
2244 {
2245 	XA_STATE(xas, xa, 0);
2246 	unsigned long flags;
2247 	void *entry;
2248 
2249 	xas.xa_node = NULL;
2250 	xas_lock_irqsave(&xas, flags);
2251 	entry = xa_head_locked(xa);
2252 	RCU_INIT_POINTER(xa->xa_head, NULL);
2253 	xas_init_marks(&xas);
2254 	if (xa_zero_busy(xa))
2255 		xa_mark_clear(xa, XA_FREE_MARK);
2256 	/* lockdep checks we're still holding the lock in xas_free_nodes() */
2257 	if (xa_is_node(entry))
2258 		xas_free_nodes(&xas, xa_to_node(entry));
2259 	xas_unlock_irqrestore(&xas, flags);
2260 }
2261 EXPORT_SYMBOL(xa_destroy);
2262 
2263 #ifdef XA_DEBUG
2264 void xa_dump_node(const struct xa_node *node)
2265 {
2266 	unsigned i, j;
2267 
2268 	if (!node)
2269 		return;
2270 	if ((unsigned long)node & 3) {
2271 		pr_cont("node %px\n", node);
2272 		return;
2273 	}
2274 
2275 	pr_cont("node %px %s %d parent %px shift %d count %d values %d "
2276 		"array %px list %px %px marks",
2277 		node, node->parent ? "offset" : "max", node->offset,
2278 		node->parent, node->shift, node->count, node->nr_values,
2279 		node->array, node->private_list.prev, node->private_list.next);
2280 	for (i = 0; i < XA_MAX_MARKS; i++)
2281 		for (j = 0; j < XA_MARK_LONGS; j++)
2282 			pr_cont(" %lx", node->marks[i][j]);
2283 	pr_cont("\n");
2284 }
2285 
2286 void xa_dump_index(unsigned long index, unsigned int shift)
2287 {
2288 	if (!shift)
2289 		pr_info("%lu: ", index);
2290 	else if (shift >= BITS_PER_LONG)
2291 		pr_info("0-%lu: ", ~0UL);
2292 	else
2293 		pr_info("%lu-%lu: ", index, index | ((1UL << shift) - 1));
2294 }
2295 
2296 void xa_dump_entry(const void *entry, unsigned long index, unsigned long shift)
2297 {
2298 	if (!entry)
2299 		return;
2300 
2301 	xa_dump_index(index, shift);
2302 
2303 	if (xa_is_node(entry)) {
2304 		if (shift == 0) {
2305 			pr_cont("%px\n", entry);
2306 		} else {
2307 			unsigned long i;
2308 			struct xa_node *node = xa_to_node(entry);
2309 			xa_dump_node(node);
2310 			for (i = 0; i < XA_CHUNK_SIZE; i++)
2311 				xa_dump_entry(node->slots[i],
2312 				      index + (i << node->shift), node->shift);
2313 		}
2314 	} else if (xa_is_value(entry))
2315 		pr_cont("value %ld (0x%lx) [%px]\n", xa_to_value(entry),
2316 						xa_to_value(entry), entry);
2317 	else if (!xa_is_internal(entry))
2318 		pr_cont("%px\n", entry);
2319 	else if (xa_is_retry(entry))
2320 		pr_cont("retry (%ld)\n", xa_to_internal(entry));
2321 	else if (xa_is_sibling(entry))
2322 		pr_cont("sibling (slot %ld)\n", xa_to_sibling(entry));
2323 	else if (xa_is_zero(entry))
2324 		pr_cont("zero (%ld)\n", xa_to_internal(entry));
2325 	else
2326 		pr_cont("UNKNOWN ENTRY (%px)\n", entry);
2327 }
2328 
2329 void xa_dump(const struct xarray *xa)
2330 {
2331 	void *entry = xa->xa_head;
2332 	unsigned int shift = 0;
2333 
2334 	pr_info("xarray: %px head %px flags %x marks %d %d %d\n", xa, entry,
2335 			xa->xa_flags, xa_marked(xa, XA_MARK_0),
2336 			xa_marked(xa, XA_MARK_1), xa_marked(xa, XA_MARK_2));
2337 	if (xa_is_node(entry))
2338 		shift = xa_to_node(entry)->shift + XA_CHUNK_SHIFT;
2339 	xa_dump_entry(entry, 0, shift);
2340 }
2341 #endif
2342