blob: deae17aa0ed7fb26296420f1802ffebcbc8d8764 [file] [log] [blame]
Matthew Wilcoxf6bb2a22018-04-10 16:36:52 -07001/* SPDX-License-Identifier: GPL-2.0+ */
2#ifndef _LINUX_XARRAY_H
3#define _LINUX_XARRAY_H
4/*
5 * eXtensible Arrays
6 * Copyright (c) 2017 Microsoft Corporation
Matthew Wilcox3d0186b2018-06-16 17:32:07 -04007 * Author: Matthew Wilcox <willy@infradead.org>
Matthew Wilcox3159f942017-11-03 13:30:42 -04008 *
9 * See Documentation/core-api/xarray.rst for how to use the XArray.
Matthew Wilcoxf6bb2a22018-04-10 16:36:52 -070010 */
11
Matthew Wilcox3159f942017-11-03 13:30:42 -040012#include <linux/bug.h>
Matthew Wilcoxf8d5d0c2017-11-07 16:30:10 -050013#include <linux/compiler.h>
Matthew Wilcox9b89a032017-11-10 09:34:31 -050014#include <linux/gfp.h>
Matthew Wilcoxf8d5d0c2017-11-07 16:30:10 -050015#include <linux/kconfig.h>
Matthew Wilcoxad3d6c72017-11-07 14:57:46 -050016#include <linux/kernel.h>
17#include <linux/rcupdate.h>
Matthew Wilcoxf6bb2a22018-04-10 16:36:52 -070018#include <linux/spinlock.h>
Matthew Wilcox3159f942017-11-03 13:30:42 -040019#include <linux/types.h>
20
21/*
22 * The bottom two bits of the entry determine how the XArray interprets
23 * the contents:
24 *
25 * 00: Pointer entry
26 * 10: Internal entry
27 * x1: Value entry or tagged pointer
28 *
29 * Attempting to store internal entries in the XArray is a bug.
Matthew Wilcox02c02bf2017-11-03 23:09:45 -040030 *
31 * Most internal entries are pointers to the next node in the tree.
32 * The following internal entries have a special meaning:
33 *
34 * 0-62: Sibling entries
35 * 256: Retry entry
Matthew Wilcoxad3d6c72017-11-07 14:57:46 -050036 *
37 * Errors are also represented as internal entries, but use the negative
38 * space (-4094 to -2). They're never stored in the slots array; only
39 * returned by the normal API.
Matthew Wilcox3159f942017-11-03 13:30:42 -040040 */
41
42#define BITS_PER_XA_VALUE (BITS_PER_LONG - 1)
43
/**
 * xa_mk_value() - Encode an integer as an XArray value entry.
 * @v: Integer to encode.
 *
 * The integer is shifted up by one bit and the bottom bit is set; a set
 * bottom bit is what marks an entry as a value.  A warning is issued if
 * the top bit of @v is set.
 *
 * Context: Any context.
 * Return: An entry suitable for storing in the XArray.
 */
static inline void *xa_mk_value(unsigned long v)
{
	unsigned long encoded = (v << 1) | 1;

	/* The shift above discards the top bit of @v, so complain if set. */
	WARN_ON((long)v < 0);
	return (void *)encoded;
}
56
/**
 * xa_to_value() - Decode the integer held in an XArray value entry.
 * @entry: XArray entry.
 *
 * Context: Any context.
 * Return: The value stored in the XArray entry.
 */
static inline unsigned long xa_to_value(const void *entry)
{
	unsigned long bits = (unsigned long)entry;

	/* Drop the bottom bit, which only marks the entry as a value. */
	return bits >> 1;
}
68
/**
 * xa_is_value() - Test whether an entry is a value entry.
 * @entry: XArray entry.
 *
 * Context: Any context.
 * Return: True if the entry is a value, false if it is a pointer.
 */
static inline bool xa_is_value(const void *entry)
{
	/* Value entries are the ones with the bottom bit set. */
	return ((unsigned long)entry & 1) != 0;
}
80
/**
 * xa_tag_pointer() - Combine a pointer and a tag into an XArray entry.
 * @p: Plain pointer.
 * @tag: Tag value (0, 1 or 3).
 *
 * Users who prefer not to store value entries can tag their pointers
 * instead.  Three tags are available (0, 1 and 3).  Tags are distinct
 * from the xa_mark_t: they are not replicated up through the array and
 * cannot be searched for.
 *
 * Context: Any context.
 * Return: An XArray entry.
 */
static inline void *xa_tag_pointer(void *p, unsigned long tag)
{
	unsigned long tagged = (unsigned long)p;

	/* The tag is OR-ed into the pointer bits. */
	tagged |= tag;
	return (void *)tagged;
}
98
/**
 * xa_untag_pointer() - Recover the plain pointer from a tagged entry.
 * @entry: XArray entry.
 *
 * Use this on an entry that was stored as a tagged pointer to get the
 * pointer back without its tag.
 *
 * Context: Any context.
 * Return: A pointer.
 */
static inline void *xa_untag_pointer(void *entry)
{
	const unsigned long tag_mask = 3UL;

	/* Clear the two low bits, which are where the tag lives. */
	return (void *)((unsigned long)entry & ~tag_mask);
}
113
/**
 * xa_pointer_tag() - Extract the tag from a tagged pointer entry.
 * @entry: XArray entry.
 *
 * Use this on an entry that was stored as a tagged pointer to find out
 * which tag it carries.
 *
 * Context: Any context.
 * Return: A tag.
 */
static inline unsigned int xa_pointer_tag(void *entry)
{
	unsigned long bits = (unsigned long)entry;

	/* Only the two low bits are returned. */
	return bits & 3UL;
}
Matthew Wilcoxf6bb2a22018-04-10 16:36:52 -0700128
/*
 * xa_mk_internal() - Build an internal entry from a number.
 * @v: Value to turn into an internal entry.
 *
 * The number is shifted up by two bits and the low bits are set to 10.
 *
 * Context: Any context.
 * Return: An XArray internal entry corresponding to this value.
 */
static inline void *xa_mk_internal(unsigned long v)
{
	unsigned long encoded = v << 2;

	encoded |= 2;
	return (void *)encoded;
}
140
/*
 * xa_to_internal() - Recover the number held in an internal entry.
 * @entry: XArray entry.
 *
 * The shift is unsigned, so no sign extension takes place.
 *
 * Context: Any context.
 * Return: The value which was stored in the internal entry.
 */
static inline unsigned long xa_to_internal(const void *entry)
{
	unsigned long bits = (unsigned long)entry;

	return bits >> 2;
}
152
/*
 * xa_is_internal() - Test whether an entry is an internal entry.
 * @entry: XArray entry.
 *
 * Context: Any context.
 * Return: %true if the entry is an internal entry.
 */
static inline bool xa_is_internal(const void *entry)
{
	unsigned long low_bits = (unsigned long)entry & 3;

	/* Internal entries are the ones whose bottom two bits are 10. */
	return low_bits == 2;
}
164
/**
 * xa_is_err() - Report whether an XArray operation returned an error.
 * @entry: Result from calling an XArray function.
 *
 * When an XArray operation cannot complete, it returns a special value
 * indicating an error.  This function tells you whether an error
 * occurred; xa_err() tells you which error occurred.  The test applied
 * is whether @entry is an internal entry.
 *
 * Context: Any context.
 * Return: %true if the entry indicates an error.
 */
static inline bool xa_is_err(const void *entry)
{
	bool internal = xa_is_internal(entry);

	return unlikely(internal);
}
180
/**
 * xa_err() - Convert an XArray result into an errno.
 * @entry: Result from calling an XArray function.
 *
 * When an XArray operation cannot complete, it returns a special pointer
 * value which encodes an errno.  This function extracts that errno, or
 * returns 0 if the pointer does not represent an errno.
 *
 * Context: Any context.
 * Return: A negative errno or 0.
 */
static inline int xa_err(void *entry)
{
	if (!xa_is_err(entry))
		return 0;

	/*
	 * Shift as a signed long: xa_to_internal() shifts an unsigned
	 * long and so would not do sign extension.
	 */
	return (long)entry >> 2;
}
200
/*
 * xa_mark_t is the type of the mark arguments taken by this header
 * (xa_get_mark(), xa_set_mark(), xa_clear_mark(), xa_marked(), ...).
 */
Matthew Wilcox9b89a032017-11-10 09:34:31 -0500201typedef unsigned __bitwise xa_mark_t;
/* The three numbered marks. */
202#define XA_MARK_0 ((__force xa_mark_t)0U)
203#define XA_MARK_1 ((__force xa_mark_t)1U)
204#define XA_MARK_2 ((__force xa_mark_t)2U)
/* A further constant of the same type, with the value 8. */
205#define XA_PRESENT ((__force xa_mark_t)8U)
/* The highest numbered mark. */
206#define XA_MARK_MAX XA_MARK_2
207
/*
 * Lock type constants.  XA_FLAGS_LOCK_IRQ and XA_FLAGS_LOCK_BH are these
 * values cast to gfp_t.
 */
Matthew Wilcox58d6ea32017-11-10 15:15:08 -0500208enum xa_lock_type {
209 XA_LOCK_IRQ = 1,
210 XA_LOCK_BH = 2,
211};
212
Matthew Wilcox9b89a032017-11-10 09:34:31 -0500213/*
214 * Values for xa_flags. The radix tree stores its GFP flags in the xa_flags,
215 * and we remain compatible with that.
216 */
/* The enum xa_lock_type constants, expressed as gfp_t flag values. */
Matthew Wilcox58d6ea32017-11-10 15:15:08 -0500217#define XA_FLAGS_LOCK_IRQ ((__force gfp_t)XA_LOCK_IRQ)
218#define XA_FLAGS_LOCK_BH ((__force gfp_t)XA_LOCK_BH)
/*
 * Flag bit for @mark: bit number (__GFP_BITS_SHIFT + mark).  xa_marked()
 * tests this bit in xa_flags.
 */
Matthew Wilcox9b89a032017-11-10 09:34:31 -0500219#define XA_FLAGS_MARK(mark) ((__force gfp_t)((1U << __GFP_BITS_SHIFT) << \
220 (__force unsigned)(mark)))
221
Matthew Wilcoxad3d6c72017-11-07 14:57:46 -0500222/**
Matthew Wilcoxf8d5d0c2017-11-07 16:30:10 -0500223 * struct xarray - The anchor of the XArray.
224 * @xa_lock: Lock that protects the contents of the XArray.
225 *
226 * To use the xarray, define it statically or embed it in your data structure.
227 * It is a very small data structure, so it does not usually make sense to
228 * allocate it separately and keep a pointer to it in your data structure.
229 *
230 * You may use the xa_lock to protect your own data structures as well.
231 */
232/*
233 * If all of the entries in the array are NULL, @xa_head is a NULL pointer.
234 * If the only non-NULL entry in the array is at index 0, @xa_head is that
235 * entry. If any other entry in the array is non-NULL, @xa_head points
236 * to an @xa_node.
237 */
238struct xarray {
	/* Taken and released by the xa_lock*() / xa_unlock*() macros. */
239 spinlock_t xa_lock;
240/* private: The rest of the data structure is not to be used directly. */
	/* Holds XA_FLAGS_* values; xa_marked() tests XA_FLAGS_MARK() bits here. */
241 gfp_t xa_flags;
	/* NULL when the array is empty; read through xa_head() / xa_head_locked(). */
242 void __rcu * xa_head;
243};
244
/*
 * Static initialiser for a struct xarray variable called @name: an
 * unlocked xa_lock, the given @flags, and a NULL head (an empty array).
 * DEFINE_XARRAY_FLAGS() is built on this.
 */
245#define XARRAY_INIT(name, flags) { \
246 .xa_lock = __SPIN_LOCK_UNLOCKED(name.xa_lock), \
247 .xa_flags = flags, \
248 .xa_head = NULL, \
249}
250
/**
 * DEFINE_XARRAY_FLAGS() - Define an XArray with custom flags.
 * @name: Identifier to give the XArray variable.
 * @flags: XA_FLAG values.
 *
 * Intended for file scope definitions of XArrays.  It declares a
 * struct xarray called @name and initialises it, empty, with the chosen
 * flags.  This is equivalent to calling xa_init_flags() on the array,
 * except that the initialisation happens at compile time rather than at
 * run time.
 */
#define DEFINE_XARRAY_FLAGS(name, flags)				\
	struct xarray name = XARRAY_INIT(name, flags)
263
/**
 * DEFINE_XARRAY() - Define an XArray.
 * @name: Identifier to give the XArray variable.
 *
 * Intended for file scope definitions of XArrays.  It declares a
 * struct xarray called @name and initialises it, empty, with a flags
 * value of 0.  This is equivalent to calling xa_init() on the array,
 * except that the initialisation happens at compile time rather than at
 * run time.
 */
#define DEFINE_XARRAY(name)	DEFINE_XARRAY_FLAGS(name, 0)
274
275void xa_init_flags(struct xarray *, gfp_t flags);
Matthew Wilcoxad3d6c72017-11-07 14:57:46 -0500276void *xa_load(struct xarray *, unsigned long index);
Matthew Wilcox58d6ea32017-11-10 15:15:08 -0500277void *xa_store(struct xarray *, unsigned long index, void *entry, gfp_t);
Matthew Wilcox41aec912017-11-10 15:34:55 -0500278void *xa_cmpxchg(struct xarray *, unsigned long index,
279 void *old, void *entry, gfp_t);
Matthew Wilcox9b89a032017-11-10 09:34:31 -0500280bool xa_get_mark(struct xarray *, unsigned long index, xa_mark_t);
281void xa_set_mark(struct xarray *, unsigned long index, xa_mark_t);
282void xa_clear_mark(struct xarray *, unsigned long index, xa_mark_t);
Matthew Wilcoxb803b422017-11-14 08:30:11 -0500283void *xa_find(struct xarray *xa, unsigned long *index,
284 unsigned long max, xa_mark_t) __attribute__((nonnull(2)));
285void *xa_find_after(struct xarray *xa, unsigned long *index,
286 unsigned long max, xa_mark_t) __attribute__((nonnull(2)));
Matthew Wilcox80a0a1a2017-11-14 16:42:22 -0500287unsigned int xa_extract(struct xarray *, void **dst, unsigned long start,
288 unsigned long max, unsigned int n, xa_mark_t);
Matthew Wilcox687149f2017-11-17 08:16:34 -0500289void xa_destroy(struct xarray *);
Matthew Wilcoxf8d5d0c2017-11-07 16:30:10 -0500290
291/**
292 * xa_init() - Initialise an empty XArray.
293 * @xa: XArray.
294 *
295 * An empty XArray is full of NULL entries.
296 *
297 * Context: Any context.
298 */
299static inline void xa_init(struct xarray *xa)
300{
301 xa_init_flags(xa, 0);
302}
303
Matthew Wilcoxad3d6c72017-11-07 14:57:46 -0500304/**
305 * xa_empty() - Determine if an array has any present entries.
306 * @xa: XArray.
307 *
308 * Context: Any context.
309 * Return: %true if the array contains only NULL pointers.
310 */
311static inline bool xa_empty(const struct xarray *xa)
312{
313 return xa->xa_head == NULL;
314}
315
Matthew Wilcox9b89a032017-11-10 09:34:31 -0500316/**
317 * xa_marked() - Inquire whether any entry in this array has a mark set
318 * @xa: Array
319 * @mark: Mark value
320 *
321 * Context: Any context.
322 * Return: %true if any entry has this mark set.
323 */
324static inline bool xa_marked(const struct xarray *xa, xa_mark_t mark)
325{
326 return xa->xa_flags & XA_FLAGS_MARK(mark);
327}
328
/**
 * xa_erase() - Erase this entry from the XArray.
 * @xa: XArray.
 * @index: Index of entry.
 *
 * The same as calling xa_store() with %NULL as the third argument.
 * The XArray does not need to allocate memory, so the user does not
 * need to provide GFP flags.
 *
 * Context: Process context.  Takes and releases the xa_lock.
 * Return: The entry which used to be at this index.
 */
static inline void *xa_erase(struct xarray *xa, unsigned long index)
{
	void *old_entry = xa_store(xa, index, NULL, 0);

	return old_entry;
}
345
Matthew Wilcox41aec912017-11-10 15:34:55 -0500346/**
347 * xa_insert() - Store this entry in the XArray unless another entry is
348 * already present.
349 * @xa: XArray.
350 * @index: Index into array.
351 * @entry: New entry.
352 * @gfp: Memory allocation flags.
353 *
354 * If you would rather see the existing entry in the array, use xa_cmpxchg().
355 * This function is for users who don't care what the entry is, only that
356 * one is present.
357 *
358 * Context: Process context. Takes and releases the xa_lock.
359 * May sleep if the @gfp flags permit.
360 * Return: 0 if the store succeeded. -EEXIST if another entry was present.
361 * -ENOMEM if memory could not be allocated.
362 */
363static inline int xa_insert(struct xarray *xa, unsigned long index,
364 void *entry, gfp_t gfp)
365{
366 void *curr = xa_cmpxchg(xa, index, NULL, entry, gfp);
367 if (!curr)
368 return 0;
369 if (xa_is_err(curr))
370 return xa_err(curr);
371 return -EEXIST;
372}
373
/**
 * xa_for_each() - Iterate over a portion of an XArray.
 * @xa: XArray.
 * @entry: Entry retrieved from array.
 * @index: Index of @entry.
 * @max: Maximum index to retrieve from array.
 * @filter: Selection criterion.
 *
 * Set @index to the lowest index you want to retrieve before starting.
 * The loop begins with xa_find() and advances with xa_find_after(); on
 * each pass @entry holds the entry stored in @xa at @index.  Entries
 * which do not match @filter are skipped.  You may modify @index during
 * the iteration if you want to skip or reprocess indices.  It is safe to
 * modify the array during the iteration.  The loop ends when @entry is
 * NULL; at that point @index will have a value less than or equal to max.
 *
 * xa_for_each() is O(n.log(n)) while xas_for_each() is O(n).  You have
 * to handle your own locking with xas_for_each(), and if you have to
 * unlock after each iteration, it will also end up being O(n.log(n)).
 * xa_for_each() will spin if it hits a retry entry; if you intend to see
 * retry entries, you should use the xas_for_each() iterator instead.
 * The xas_for_each() iterator will expand into more inline code than
 * xa_for_each().
 *
 * Context: Any context.  Takes and releases the RCU lock.
 */
#define xa_for_each(xa, entry, index, max, filter)			\
	for (entry = xa_find(xa, &index, max, filter);			\
	     entry;							\
	     entry = xa_find_after(xa, &index, max, filter))
402
/*
 * Locking helpers: each macro applies the spinlock operation of the
 * matching name (spin_trylock(), spin_lock(), spin_lock_bh(), ...) to the
 * xa_lock embedded in the XArray.  @flags is passed straight through to
 * the irqsave / irqrestore variants.
 */
Matthew Wilcoxf6bb2a22018-04-10 16:36:52 -0700403#define xa_trylock(xa) spin_trylock(&(xa)->xa_lock)
404#define xa_lock(xa) spin_lock(&(xa)->xa_lock)
405#define xa_unlock(xa) spin_unlock(&(xa)->xa_lock)
406#define xa_lock_bh(xa) spin_lock_bh(&(xa)->xa_lock)
407#define xa_unlock_bh(xa) spin_unlock_bh(&(xa)->xa_lock)
408#define xa_lock_irq(xa) spin_lock_irq(&(xa)->xa_lock)
409#define xa_unlock_irq(xa) spin_unlock_irq(&(xa)->xa_lock)
410#define xa_lock_irqsave(xa, flags) \
411 spin_lock_irqsave(&(xa)->xa_lock, flags)
412#define xa_unlock_irqrestore(xa, flags) \
413 spin_unlock_irqrestore(&(xa)->xa_lock, flags)
414
Matthew Wilcox9b89a032017-11-10 09:34:31 -0500415/*
Matthew Wilcox58d6ea32017-11-10 15:15:08 -0500416 * Versions of the normal API which require the caller to hold the
417 * xa_lock. If the GFP flags allow it, they will drop the lock to
418 * allocate memory, then reacquire it afterwards. These functions
419 * may also re-enable interrupts if the XArray flags indicate the
420 * locking should be interrupt safe.
Matthew Wilcox9b89a032017-11-10 09:34:31 -0500421 */
Matthew Wilcox58d6ea32017-11-10 15:15:08 -0500422void *__xa_erase(struct xarray *, unsigned long index);
423void *__xa_store(struct xarray *, unsigned long index, void *entry, gfp_t);
Matthew Wilcox41aec912017-11-10 15:34:55 -0500424void *__xa_cmpxchg(struct xarray *, unsigned long index, void *old,
425 void *entry, gfp_t);
Matthew Wilcox9b89a032017-11-10 09:34:31 -0500426void __xa_set_mark(struct xarray *, unsigned long index, xa_mark_t);
427void __xa_clear_mark(struct xarray *, unsigned long index, xa_mark_t);
428
Matthew Wilcox58d6ea32017-11-10 15:15:08 -0500429/**
Matthew Wilcox41aec912017-11-10 15:34:55 -0500430 * __xa_insert() - Store this entry in the XArray unless another entry is
431 * already present.
432 * @xa: XArray.
433 * @index: Index into array.
434 * @entry: New entry.
435 * @gfp: Memory allocation flags.
436 *
437 * If you would rather see the existing entry in the array, use __xa_cmpxchg().
438 * This function is for users who don't care what the entry is, only that
439 * one is present.
440 *
441 * Context: Any context. Expects xa_lock to be held on entry. May
442 * release and reacquire xa_lock if the @gfp flags permit.
443 * Return: 0 if the store succeeded. -EEXIST if another entry was present.
444 * -ENOMEM if memory could not be allocated.
445 */
446static inline int __xa_insert(struct xarray *xa, unsigned long index,
447 void *entry, gfp_t gfp)
448{
449 void *curr = __xa_cmpxchg(xa, index, NULL, entry, gfp);
450 if (!curr)
451 return 0;
452 if (xa_is_err(curr))
453 return xa_err(curr);
454 return -EEXIST;
455}
456
/**
 * xa_erase_bh() - Erase this entry from the XArray.
 * @xa: XArray.
 * @index: Index of entry.
 *
 * Wraps __xa_erase() in xa_lock_bh() / xa_unlock_bh().  The effect is
 * that of calling xa_store() with %NULL as the third argument.  The
 * XArray does not need to allocate memory, so the user does not need to
 * provide GFP flags.
 *
 * Context: Process context.  Takes and releases the xa_lock while
 *	    disabling softirqs.
 * Return: The entry which used to be at this index.
 */
static inline void *xa_erase_bh(struct xarray *xa, unsigned long index)
{
	void *old_entry;

	xa_lock_bh(xa);
	old_entry = __xa_erase(xa, index);
	xa_unlock_bh(xa);

	return old_entry;
}
480
/**
 * xa_erase_irq() - Erase this entry from the XArray.
 * @xa: XArray.
 * @index: Index of entry.
 *
 * Wraps __xa_erase() in xa_lock_irq() / xa_unlock_irq().  The effect is
 * that of calling xa_store() with %NULL as the third argument.  The
 * XArray does not need to allocate memory, so the user does not need to
 * provide GFP flags.
 *
 * Context: Process context.  Takes and releases the xa_lock while
 *	    disabling interrupts.
 * Return: The entry which used to be at this index.
 */
static inline void *xa_erase_irq(struct xarray *xa, unsigned long index)
{
	void *old_entry;

	xa_lock_irq(xa);
	old_entry = __xa_erase(xa, index);
	xa_unlock_irq(xa);

	return old_entry;
}
504
Matthew Wilcox02c02bf2017-11-03 23:09:45 -0400505/* Everything below here is the Advanced API. Proceed with caution. */
506
507/*
508 * The xarray is constructed out of a set of 'chunks' of pointers. Choosing
509 * the best chunk size requires some tradeoffs. A power of two recommends
510 * itself so that we can walk the tree based purely on shifts and masks.
511 * Generally, the larger the better; as the number of slots per level of the
512 * tree increases, the less tall the tree needs to be. But that needs to be
513 * balanced against the memory consumption of each node. On a 64-bit system,
514 * xa_node is currently 576 bytes, and we get 7 of them per 4kB page. If we
515 * doubled the number of slots per node, we'd get only 3 nodes per 4kB page.
516 */
/* A definition of XA_CHUNK_SHIFT made before this point takes precedence. */
517#ifndef XA_CHUNK_SHIFT
518#define XA_CHUNK_SHIFT (CONFIG_BASE_SMALL ? 4 : 6)
519#endif
/* Number of slots in one xa_node, and the mask with the low XA_CHUNK_SHIFT bits set. */
520#define XA_CHUNK_SIZE (1UL << XA_CHUNK_SHIFT)
521#define XA_CHUNK_MASK (XA_CHUNK_SIZE - 1)
/*
 * Dimensions of the per-node mark arrays: XA_MAX_MARKS rows, each of
 * enough longs to provide XA_CHUNK_SIZE bits.
 */
Matthew Wilcox01959df2017-11-09 09:23:56 -0500522#define XA_MAX_MARKS 3
523#define XA_MARK_LONGS DIV_ROUND_UP(XA_CHUNK_SIZE, BITS_PER_LONG)
524
525/*
526 * @count is the count of every non-NULL element in the ->slots array
527 * whether that is a value entry, a retry entry, a user pointer,
528 * a sibling entry or a pointer to the next level of the tree.
529 * @nr_values is the count of every element in ->slots which is
530 * either a value entry or a sibling of a value entry.
531 */
/* One node of the tree: bookkeeping fields, XA_CHUNK_SIZE slots and mark bitmaps. */
532struct xa_node {
533 unsigned char shift; /* Bits remaining in each slot */
534 unsigned char offset; /* Slot offset in parent */
535 unsigned char count; /* Total entry count */
536 unsigned char nr_values; /* Value entry count */
537 struct xa_node __rcu *parent; /* NULL at top of tree */
538 struct xarray *array; /* The array we belong to */
	/* These two members share storage. */
539 union {
540 struct list_head private_list; /* For tree user */
541 struct rcu_head rcu_head; /* Used when freeing node */
542 };
	/* The entries themselves; read through xa_entry() / xa_entry_locked(). */
543 void __rcu *slots[XA_CHUNK_SIZE];
	/* Two names for the same storage: XA_MARK_LONGS longs for each of XA_MAX_MARKS rows. */
544 union {
545 unsigned long tags[XA_MAX_MARKS][XA_MARK_LONGS];
546 unsigned long marks[XA_MAX_MARKS][XA_MARK_LONGS];
547 };
548};
Matthew Wilcox02c02bf2017-11-03 23:09:45 -0400549
/*
 * Dump helpers called by XA_BUG_ON() and XA_NODE_BUG_ON() before BUG().
 * Declarations only; parameters are named for readability.
 */
void xa_dump(const struct xarray *xa);
void xa_dump_node(const struct xa_node *node);
552
/*
 * Debug assertions.  With XA_DEBUG defined, a true condition @x dumps the
 * array (or the node, when @node is non-NULL) and then calls BUG().
 */
553#ifdef XA_DEBUG
554#define XA_BUG_ON(xa, x) do { \
555 if (x) { \
556 xa_dump(xa); \
557 BUG(); \
558 } \
559 } while (0)
560#define XA_NODE_BUG_ON(node, x) do { \
561 if (x) { \
562 if (node) xa_dump_node(node); \
563 BUG(); \
564 } \
565 } while (0)
566#else
/* Without XA_DEBUG both macros expand to nothing; @x is not evaluated. */
567#define XA_BUG_ON(xa, x) do { } while (0)
568#define XA_NODE_BUG_ON(node, x) do { } while (0)
569#endif
570
571/* Private */
572static inline void *xa_head(const struct xarray *xa)
573{
574 return rcu_dereference_check(xa->xa_head,
575 lockdep_is_held(&xa->xa_lock));
576}
577
578/* Private */
579static inline void *xa_head_locked(const struct xarray *xa)
580{
581 return rcu_dereference_protected(xa->xa_head,
582 lockdep_is_held(&xa->xa_lock));
583}
584
585/* Private */
586static inline void *xa_entry(const struct xarray *xa,
587 const struct xa_node *node, unsigned int offset)
588{
589 XA_NODE_BUG_ON(node, offset >= XA_CHUNK_SIZE);
590 return rcu_dereference_check(node->slots[offset],
591 lockdep_is_held(&xa->xa_lock));
592}
593
594/* Private */
595static inline void *xa_entry_locked(const struct xarray *xa,
596 const struct xa_node *node, unsigned int offset)
597{
598 XA_NODE_BUG_ON(node, offset >= XA_CHUNK_SIZE);
599 return rcu_dereference_protected(node->slots[offset],
600 lockdep_is_held(&xa->xa_lock));
601}
602
603/* Private */
Matthew Wilcox9b89a032017-11-10 09:34:31 -0500604static inline struct xa_node *xa_parent(const struct xarray *xa,
605 const struct xa_node *node)
606{
607 return rcu_dereference_check(node->parent,
608 lockdep_is_held(&xa->xa_lock));
609}
610
611/* Private */
612static inline struct xa_node *xa_parent_locked(const struct xarray *xa,
613 const struct xa_node *node)
614{
615 return rcu_dereference_protected(node->parent,
616 lockdep_is_held(&xa->xa_lock));
617}
618
/* Private: turn a node pointer into an entry by setting bit 1. */
static inline void *xa_mk_node(const struct xa_node *node)
{
	unsigned long tagged = (unsigned long)node;

	tagged |= 2;
	return (void *)tagged;
}
624
/* Private: recover the node pointer from an entry by subtracting 2. */
static inline struct xa_node *xa_to_node(const void *entry)
{
	unsigned long addr = (unsigned long)entry;

	addr -= 2;
	return (struct xa_node *)addr;
}
630
/* Private: an internal entry whose value is above 4096 is a node pointer. */
static inline bool xa_is_node(const void *entry)
{
	if (!xa_is_internal(entry))
		return false;
	return (unsigned long)entry > 4096;
}
636
/* Private: a sibling entry is the internal entry numbered @offset. */
static inline void *xa_mk_sibling(unsigned int offset)
{
	void *sibling = xa_mk_internal(offset);

	return sibling;
}
642
/* Private: recover the number held in a sibling entry. */
static inline unsigned long xa_to_sibling(const void *entry)
{
	unsigned long offset = xa_to_internal(entry);

	return offset;
}
648
649/**
650 * xa_is_sibling() - Is the entry a sibling entry?
651 * @entry: Entry retrieved from the XArray
652 *
653 * Return: %true if the entry is a sibling entry.
654 */
655static inline bool xa_is_sibling(const void *entry)
656{
657 return IS_ENABLED(CONFIG_XARRAY_MULTI) && xa_is_internal(entry) &&
658 (entry < xa_mk_sibling(XA_CHUNK_SIZE - 1));
659}
660
/* The retry entry is internal entry number 256; xa_is_retry() compares against it. */
661#define XA_RETRY_ENTRY xa_mk_internal(256)
662
Matthew Wilcoxad3d6c72017-11-07 14:57:46 -0500663/**
664 * xa_is_retry() - Is the entry a retry entry?
665 * @entry: Entry retrieved from the XArray
666 *
667 * Return: %true if the entry is a retry entry.
668 */
669static inline bool xa_is_retry(const void *entry)
670{
671 return unlikely(entry == XA_RETRY_ENTRY);
672}
673
/**
 * typedef xa_update_node_t - A callback function from the XArray.
 * @node: The node which is being processed.
 *
 * The XArray calls this function each time it updates the count of
 * present and value entries in a node.  Advanced users can use it to
 * maintain the private_list in the node.
 *
 * Context: The xa_lock is held and interrupts may be disabled.
 *	    Implementations should not drop the xa_lock, nor re-enable
 *	    interrupts.
 */
typedef void (*xa_update_node_t)(struct xa_node *node);
687
688/*
689 * The xa_state is opaque to its users. It contains various different pieces
690 * of state involved in the current operation on the XArray. It should be
691 * declared on the stack and passed between the various internal routines.
692 * The various elements in it should not be accessed directly, but only
693 * through the provided accessor functions. The below documentation is for
694 * the benefit of those working on the code, not for users of the XArray.
695 *
696 * @xa_node usually points to the xa_node containing the slot we're operating
697 * on (and @xa_offset is the offset in the slots array). If there is a
698 * single entry in the array at index 0, there are no allocated xa_nodes to
699 * point to, and so we store %NULL in @xa_node. @xa_node is set to
700 * the value %XAS_RESTART if the xa_state is not walked to the correct
701 * position in the tree of nodes for this operation. If an error occurs
702 * during an operation, it is set to an %XAS_ERROR value. If we run off the
703 * end of the allocated nodes, it is set to %XAS_BOUNDS.
704 */
/* Initialised by the __XA_STATE() initialiser; see XA_STATE() and XA_STATE_ORDER(). */
705struct xa_state {
	/* The array being operated on; the xas_lock*() macros lock through this. */
706 struct xarray *xa;
	/* Index of interest, as given to XA_STATE() / XA_STATE_ORDER(). */
707 unsigned long xa_index;
	/* Both 0 from XA_STATE(); derived from the order by XA_STATE_ORDER(). */
708 unsigned char xa_shift;
709 unsigned char xa_sibs;
	/* Offset in the slots array of xa_node. */
710 unsigned char xa_offset;
711 unsigned char xa_pad; /* Helps gcc generate better code */
	/* A node, NULL, XAS_RESTART, XAS_BOUNDS or an XA_ERROR() value. */
712 struct xa_node *xa_node;
	/* Starts as NULL; NOTE(review): its use is not visible in this header. */
713 struct xa_node *xa_alloc;
	/* Optional xa_update_node_t callback; starts as NULL. */
714 xa_update_node_t xa_update;
715};
716
/*
 * We encode errnos in the xas->xa_node.  If an error has happened, we need to
 * drop the lock to fix it, and once we've done so the xa_state is invalid.
 *
 * XA_ERROR() lays the errno out like an internal entry: shifted up by two
 * bits with bit 1 set, so xa_err() can decode it.  The argument is
 * parenthesised so that any expression (for example a conditional) is
 * cast and shifted as a whole.  XAS_BOUNDS and XAS_RESTART are the two
 * other special, non-node values of xa_node.
 */
#define XA_ERROR(err) ((struct xa_node *)(((unsigned long)(err) << 2) | 2UL))
#define XAS_BOUNDS	((struct xa_node *)1UL)
#define XAS_RESTART	((struct xa_node *)3UL)
724
/*
 * Initialiser for a struct xa_state.  The caller supplies the array, index,
 * shift and sibs; the walk state starts at XAS_RESTART with offset 0, no
 * allocated node and no update callback.
 */
725#define __XA_STATE(array, index, shift, sibs) { \
726 .xa = array, \
727 .xa_index = index, \
728 .xa_shift = shift, \
729 .xa_sibs = sibs, \
730 .xa_offset = 0, \
731 .xa_pad = 0, \
732 .xa_node = XAS_RESTART, \
733 .xa_alloc = NULL, \
734 .xa_update = NULL \
735}
736
/**
 * XA_STATE() - Declare an XArray operation state.
 * @name: Name of this operation state (usually xas).
 * @array: Array to operate on.
 * @index: Initial index of interest.
 *
 * Declare and initialise an xa_state on the stack, with a shift and a
 * sibling count of 0.
 */
#define XA_STATE(name, array, index)					\
	struct xa_state name = __XA_STATE(array, index, 0, 0)
747
/**
 * XA_STATE_ORDER() - Declare an XArray operation state.
 * @name: Name of this operation state (usually xas).
 * @array: Array to operate on.
 * @index: Initial index of interest.
 * @order: Order of entry.
 *
 * Declare and initialise an xa_state on the stack.  This variant of
 * XA_STATE() allows you to specify the 'order' of the element you
 * want to operate on.  The index is rounded down to a multiple of
 * 2^@order; the shift is @order rounded down to a multiple of
 * XA_CHUNK_SHIFT and the sibling count covers the remainder.
 *
 * @index and @order are parenthesised in the expansion so expressions
 * may be passed, but @order is evaluated more than once and so must not
 * have side effects.
 */
#define XA_STATE_ORDER(name, array, index, order)			\
	struct xa_state name = __XA_STATE(array,			\
			((index) >> (order)) << (order),		\
			(order) - ((order) % XA_CHUNK_SHIFT),		\
			(1U << ((order) % XA_CHUNK_SHIFT)) - 1)
764
/*
 * Convenience wrappers: each applies the xa_* macro or function of the
 * matching name to the array that the xa_state refers to.
 */
765#define xas_marked(xas, mark) xa_marked((xas)->xa, (mark))
766#define xas_trylock(xas) xa_trylock((xas)->xa)
767#define xas_lock(xas) xa_lock((xas)->xa)
768#define xas_unlock(xas) xa_unlock((xas)->xa)
769#define xas_lock_bh(xas) xa_lock_bh((xas)->xa)
770#define xas_unlock_bh(xas) xa_unlock_bh((xas)->xa)
771#define xas_lock_irq(xas) xa_lock_irq((xas)->xa)
772#define xas_unlock_irq(xas) xa_unlock_irq((xas)->xa)
773#define xas_lock_irqsave(xas, flags) \
774 xa_lock_irqsave((xas)->xa, flags)
775#define xas_unlock_irqrestore(xas, flags) \
776 xa_unlock_irqrestore((xas)->xa, flags)
777
778/**
779 * xas_error() - Return an errno stored in the xa_state.
780 * @xas: XArray operation state.
781 *
782 * Return: 0 if no error has been noted. A negative errno if one has.
783 */
784static inline int xas_error(const struct xa_state *xas)
785{
786 return xa_err(xas->xa_node);
787}
788
789/**
790 * xas_set_err() - Note an error in the xa_state.
791 * @xas: XArray operation state.
792 * @err: Negative error number.
793 *
794 * Only call this function with a negative @err; zero or positive errors
795 * will probably not behave the way you think they should. If you want
796 * to clear the error from an xa_state, use xas_reset().
797 */
798static inline void xas_set_err(struct xa_state *xas, long err)
799{
800 xas->xa_node = XA_ERROR(err);
801}
802
803/**
804 * xas_invalid() - Is the xas in a retry or error state?
805 * @xas: XArray operation state.
806 *
807 * Return: %true if the xas cannot be used for operations.
808 */
809static inline bool xas_invalid(const struct xa_state *xas)
810{
811 return (unsigned long)xas->xa_node & 3;
812}
813
/**
 * xas_valid() - Is the xas a valid cursor into the array?
 * @xas: XArray operation state.
 *
 * The exact opposite of xas_invalid().
 *
 * Return: %true if the xas can be used for operations.
 */
static inline bool xas_valid(const struct xa_state *xas)
{
	if (xas_invalid(xas))
		return false;
	return true;
}
824
Matthew Wilcox2264f512017-12-04 00:11:48 -0500825/**
826 * xas_is_node() - Does the xas point to a node?
827 * @xas: XArray operation state.
828 *
829 * Return: %true if the xas currently references a node.
830 */
831static inline bool xas_is_node(const struct xa_state *xas)
832{
833 return xas_valid(xas) && xas->xa_node;
834}
835
/* True if the pointer is something other than a node */
static inline bool xas_not_node(struct xa_node *node)
{
	/* NULL is not a node; neither is anything with a low bit set. */
	if (!node)
		return true;
	return ((unsigned long)node & 3) != 0;
}
841
/* True if the node represents RESTART or an error */
static inline bool xas_frozen(struct xa_node *node)
{
	/* Both XAS_RESTART and XA_ERROR() values have bit 1 set. */
	return ((unsigned long)node & 2) != 0;
}
847
Matthew Wilcox58d6ea32017-11-10 15:15:08 -0500848/* True if the node represents head-of-tree, RESTART or BOUNDS */
849static inline bool xas_top(struct xa_node *node)
850{
851 return node <= XAS_RESTART;
852}
853
Matthew Wilcoxad3d6c72017-11-07 14:57:46 -0500854/**
855 * xas_reset() - Reset an XArray operation state.
856 * @xas: XArray operation state.
857 *
858 * Resets the error or walk state of the @xas so future walks of the
859 * array will start from the root. Use this if you have dropped the
860 * xarray lock and want to reuse the xa_state.
861 *
862 * Context: Any context.
863 */
864static inline void xas_reset(struct xa_state *xas)
865{
866 xas->xa_node = XAS_RESTART;
867}
868
/**
 * xas_retry() - Retry the operation if appropriate.
 * @xas: XArray operation state.
 * @entry: Entry from xarray.
 *
 * The advanced functions may sometimes return an internal entry, such as
 * a retry entry or a zero entry.  If @entry is a retry entry, this
 * function resets @xas so that the walk restarts from the head of the
 * array; any other entry leaves @xas untouched.
 *
 * Context: Any context.
 * Return: true if the operation needs to be retried.
 */
static inline bool xas_retry(struct xa_state *xas, const void *entry)
{
	if (xa_is_retry(entry)) {
		xas_reset(xas);
		return true;
	}
	return false;
}
888
889void *xas_load(struct xa_state *);
Matthew Wilcox58d6ea32017-11-10 15:15:08 -0500890void *xas_store(struct xa_state *, void *entry);
Matthew Wilcoxb803b422017-11-14 08:30:11 -0500891void *xas_find(struct xa_state *, unsigned long max);
Matthew Wilcox4e99d4e2018-06-01 22:46:02 -0400892void *xas_find_conflict(struct xa_state *);
Matthew Wilcoxad3d6c72017-11-07 14:57:46 -0500893
Matthew Wilcox9b89a032017-11-10 09:34:31 -0500894bool xas_get_mark(const struct xa_state *, xa_mark_t);
895void xas_set_mark(const struct xa_state *, xa_mark_t);
896void xas_clear_mark(const struct xa_state *, xa_mark_t);
Matthew Wilcoxb803b422017-11-14 08:30:11 -0500897void *xas_find_marked(struct xa_state *, unsigned long max, xa_mark_t);
Matthew Wilcox58d6ea32017-11-10 15:15:08 -0500898void xas_init_marks(const struct xa_state *);
899
900bool xas_nomem(struct xa_state *, gfp_t);
Matthew Wilcoxb803b422017-11-14 08:30:11 -0500901void xas_pause(struct xa_state *);
Matthew Wilcox9b89a032017-11-10 09:34:31 -0500902
Matthew Wilcox2264f512017-12-04 00:11:48 -0500903void xas_create_range(struct xa_state *);
904
Matthew Wilcoxad3d6c72017-11-07 14:57:46 -0500905/**
906 * xas_reload() - Refetch an entry from the xarray.
907 * @xas: XArray operation state.
908 *
909 * Use this function to check that a previously loaded entry still has
910 * the same value. This is useful for the lockless pagecache lookup where
911 * we walk the array with only the RCU lock to protect us, lock the page,
912 * then check that the page hasn't moved since we looked it up.
913 *
914 * The caller guarantees that @xas is still valid. If it may be in an
915 * error or restart state, call xas_load() instead.
916 *
917 * Return: The entry at this location in the xarray.
918 */
919static inline void *xas_reload(struct xa_state *xas)
920{
921 struct xa_node *node = xas->xa_node;
922
923 if (node)
924 return xa_entry(xas->xa, node, xas->xa_offset);
925 return xa_head(xas->xa);
926}
927
Matthew Wilcox58d6ea32017-11-10 15:15:08 -0500928/**
929 * xas_set() - Set up XArray operation state for a different index.
930 * @xas: XArray operation state.
931 * @index: New index into the XArray.
932 *
933 * Move the operation state to refer to a different index. This will
934 * have the effect of starting a walk from the top; see xas_next()
935 * to move to an adjacent index.
936 */
937static inline void xas_set(struct xa_state *xas, unsigned long index)
938{
939 xas->xa_index = index;
940 xas->xa_node = XAS_RESTART;
941}
942
/**
 * xas_set_order() - Set up XArray operation state for a multislot entry.
 * @xas: XArray operation state.
 * @index: Target of the operation.
 * @order: Entry occupies 2^@order indices.
 *
 * With CONFIG_XARRAY_MULTI, @index is rounded down to a multiple of
 * 2^@order (or set to 0 when @order is at least %BITS_PER_LONG), the
 * shift and sibling count are derived from @order, and @xas is put into
 * the restart state.  Without it, a non-zero @order is a bug and the
 * call behaves like xas_set().
 */
static inline void xas_set_order(struct xa_state *xas, unsigned long index,
					unsigned int order)
{
#ifdef CONFIG_XARRAY_MULTI
	/* Part of the order that does not fill a whole chunk level */
	unsigned int sub_order = order % XA_CHUNK_SHIFT;

	if (order < BITS_PER_LONG)
		xas->xa_index = (index >> order) << order;
	else
		xas->xa_index = 0;
	xas->xa_shift = order - sub_order;
	xas->xa_sibs = (1 << sub_order) - 1;
	xas_reset(xas);
#else
	BUG_ON(order > 0);
	xas_set(xas, index);
#endif
}
962
963/**
964 * xas_set_update() - Set up XArray operation state for a callback.
965 * @xas: XArray operation state.
966 * @update: Function to call when updating a node.
967 *
968 * The XArray can notify a caller after it has updated an xa_node.
969 * This is advanced functionality and is only needed by the page cache.
970 */
971static inline void xas_set_update(struct xa_state *xas, xa_update_node_t update)
972{
973 xas->xa_update = update;
974}
975
Matthew Wilcoxb803b422017-11-14 08:30:11 -0500976/**
977 * xas_next_entry() - Advance iterator to next present entry.
978 * @xas: XArray operation state.
979 * @max: Highest index to return.
980 *
981 * xas_next_entry() is an inline function to optimise xarray traversal for
982 * speed. It is equivalent to calling xas_find(), and will call xas_find()
983 * for all the hard cases.
984 *
985 * Return: The next present entry after the one currently referred to by @xas.
986 */
987static inline void *xas_next_entry(struct xa_state *xas, unsigned long max)
988{
989 struct xa_node *node = xas->xa_node;
990 void *entry;
991
992 if (unlikely(xas_not_node(node) || node->shift ||
993 xas->xa_offset != (xas->xa_index & XA_CHUNK_MASK)))
994 return xas_find(xas, max);
995
996 do {
997 if (unlikely(xas->xa_index >= max))
998 return xas_find(xas, max);
999 if (unlikely(xas->xa_offset == XA_CHUNK_MASK))
1000 return xas_find(xas, max);
1001 entry = xa_entry(xas->xa, node, xas->xa_offset + 1);
1002 if (unlikely(xa_is_internal(entry)))
1003 return xas_find(xas, max);
1004 xas->xa_offset++;
1005 xas->xa_index++;
1006 } while (!entry);
1007
1008 return entry;
1009}
1010
1011/* Private */
1012static inline unsigned int xas_find_chunk(struct xa_state *xas, bool advance,
1013 xa_mark_t mark)
1014{
1015 unsigned long *addr = xas->xa_node->marks[(__force unsigned)mark];
1016 unsigned int offset = xas->xa_offset;
1017
1018 if (advance)
1019 offset++;
1020 if (XA_CHUNK_SIZE == BITS_PER_LONG) {
1021 if (offset < XA_CHUNK_SIZE) {
1022 unsigned long data = *addr & (~0UL << offset);
1023 if (data)
1024 return __ffs(data);
1025 }
1026 return XA_CHUNK_SIZE;
1027 }
1028
1029 return find_next_bit(addr, XA_CHUNK_SIZE, offset);
1030}
1031
1032/**
1033 * xas_next_marked() - Advance iterator to next marked entry.
1034 * @xas: XArray operation state.
1035 * @max: Highest index to return.
1036 * @mark: Mark to search for.
1037 *
1038 * xas_next_marked() is an inline function to optimise xarray traversal for
1039 * speed. It is equivalent to calling xas_find_marked(), and will call
1040 * xas_find_marked() for all the hard cases.
1041 *
1042 * Return: The next marked entry after the one currently referred to by @xas.
1043 */
1044static inline void *xas_next_marked(struct xa_state *xas, unsigned long max,
1045 xa_mark_t mark)
1046{
1047 struct xa_node *node = xas->xa_node;
1048 unsigned int offset;
1049
1050 if (unlikely(xas_not_node(node) || node->shift))
1051 return xas_find_marked(xas, max, mark);
1052 offset = xas_find_chunk(xas, true, mark);
1053 xas->xa_offset = offset;
1054 xas->xa_index = (xas->xa_index & ~XA_CHUNK_MASK) + offset;
1055 if (xas->xa_index > max)
1056 return NULL;
1057 if (offset == XA_CHUNK_SIZE)
1058 return xas_find_marked(xas, max, mark);
1059 return xa_entry(xas->xa, node, offset);
1060}
1061
/*
 * When iterating with a lock held, the lock should be dropped and the
 * task rescheduled once every %XA_CHECK_SCHED loops.
 */
enum {
	XA_CHECK_SCHED = 1 << 12,	/* 4096 */
};
1069
/**
 * xas_for_each() - Iterate over a range of an XArray.
 * @xas: XArray operation state.
 * @entry: Entry retrieved from the array.
 * @max: Maximum index to retrieve from array.
 *
 * Runs the loop body once for every entry present in the xarray between
 * the current position of @xas and @max, with @entry set to the entry
 * that was retrieved.  The first entry comes from xas_find(), later ones
 * from xas_next_entry(); the loop ends when either returns %NULL.
 *
 * Entries may be deleted from the array inside the loop body.  Hold
 * either the RCU lock or the xa_lock while iterating, and call
 * xas_pause() before dropping the lock.
 */
#define xas_for_each(xas, entry, max) \
	for (entry = xas_find(xas, max); entry; \
	     entry = xas_next_entry(xas, max))
1086
/**
 * xas_for_each_marked() - Iterate over marked entries in a range of an XArray.
 * @xas: XArray operation state.
 * @entry: Entry retrieved from the array.
 * @max: Maximum index to retrieve from array.
 * @mark: Mark to search for.
 *
 * Runs the loop body once for every marked entry in the xarray between
 * the current position of @xas and @max, with @entry set to the entry
 * that was retrieved.  The first entry comes from xas_find_marked(),
 * later ones from xas_next_marked(); the loop ends when either returns
 * %NULL.
 *
 * Entries may be deleted from the array inside the loop body.  Hold
 * either the RCU lock or the xa_lock while iterating, and call
 * xas_pause() before dropping the lock.
 */
#define xas_for_each_marked(xas, entry, max, mark) \
	for (entry = xas_find_marked(xas, max, mark); entry; \
	     entry = xas_next_marked(xas, max, mark))
1104
/**
 * xas_for_each_conflict() - Iterate over a range of an XArray.
 * @xas: XArray operation state.
 * @entry: Entry retrieved from the array.
 *
 * The loop body will be executed for each entry in the XArray that lies
 * within the range specified by @xas.  This macro only looks entries up
 * with xas_find_conflict(); it does not store anything in the array.
 * If the loop terminates normally, @entry will be %NULL.  The caller may
 * break out of the loop, which leaves @entry set to the conflicting
 * entry.  The caller may also call xas_set_err() to exit the loop while
 * setting an error to record the reason.
 */
#define xas_for_each_conflict(xas, entry) \
	while ((entry = xas_find_conflict(xas)))
1120
/* Out-of-line paths used by xas_next() and xas_prev() */
void *__xas_next(struct xa_state *xas);
void *__xas_prev(struct xa_state *xas);
1123
1124/**
1125 * xas_prev() - Move iterator to previous index.
1126 * @xas: XArray operation state.
1127 *
1128 * If the @xas was in an error state, it will remain in an error state
1129 * and this function will return %NULL. If the @xas has never been walked,
1130 * it will have the effect of calling xas_load(). Otherwise one will be
1131 * subtracted from the index and the state will be walked to the correct
1132 * location in the array for the next operation.
1133 *
1134 * If the iterator was referencing index 0, this function wraps
1135 * around to %ULONG_MAX.
1136 *
1137 * Return: The entry at the new index. This may be %NULL or an internal
1138 * entry.
1139 */
1140static inline void *xas_prev(struct xa_state *xas)
1141{
1142 struct xa_node *node = xas->xa_node;
1143
1144 if (unlikely(xas_not_node(node) || node->shift ||
1145 xas->xa_offset == 0))
1146 return __xas_prev(xas);
1147
1148 xas->xa_index--;
1149 xas->xa_offset--;
1150 return xa_entry(xas->xa, node, xas->xa_offset);
1151}
1152
1153/**
1154 * xas_next() - Move state to next index.
1155 * @xas: XArray operation state.
1156 *
1157 * If the @xas was in an error state, it will remain in an error state
1158 * and this function will return %NULL. If the @xas has never been walked,
1159 * it will have the effect of calling xas_load(). Otherwise one will be
1160 * added to the index and the state will be walked to the correct
1161 * location in the array for the next operation.
1162 *
1163 * If the iterator was referencing index %ULONG_MAX, this function wraps
1164 * around to 0.
1165 *
1166 * Return: The entry at the new index. This may be %NULL or an internal
1167 * entry.
1168 */
1169static inline void *xas_next(struct xa_state *xas)
1170{
1171 struct xa_node *node = xas->xa_node;
1172
1173 if (unlikely(xas_not_node(node) || node->shift ||
1174 xas->xa_offset == XA_CHUNK_MASK))
1175 return __xas_next(xas);
1176
1177 xas->xa_index++;
1178 xas->xa_offset++;
1179 return xa_entry(xas->xa, node, xas->xa_offset);
1180}
1181
Matthew Wilcoxf6bb2a22018-04-10 16:36:52 -07001182#endif /* _LINUX_XARRAY_H */