Blame view

lib/radix-tree.c 52.6 KB
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1
2
3
  /*
   * Copyright (C) 2001 Momchil Velikov
   * Portions Copyright (C) 2001 Christoph Hellwig
cde535359   Christoph Lameter   Christoph has moved
4
   * Copyright (C) 2005 SGI, Christoph Lameter
7cf9c2c76   Nick Piggin   [PATCH] radix-tre...
5
   * Copyright (C) 2006 Nick Piggin
78c1d7848   Konstantin Khlebnikov   radix-tree: intro...
6
   * Copyright (C) 2012 Konstantin Khlebnikov
6b053b8e5   Matthew Wilcox   radix-tree: add c...
7
8
   * Copyright (C) 2016 Intel, Matthew Wilcox
   * Copyright (C) 2016 Intel, Ross Zwisler
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
   *
   * This program is free software; you can redistribute it and/or
   * modify it under the terms of the GNU General Public License as
   * published by the Free Software Foundation; either version 2, or (at
   * your option) any later version.
   *
   * This program is distributed in the hope that it will be useful, but
   * WITHOUT ANY WARRANTY; without even the implied warranty of
   * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
   * General Public License for more details.
   *
   * You should have received a copy of the GNU General Public License
   * along with this program; if not, write to the Free Software
   * Foundation, Inc., 675 Mass Ave, Cambridge, MA 02139, USA.
   */
e157b5559   Matthew Wilcox   radix-tree: add r...
24
  #include <linux/cpu.h>
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
25
26
27
  #include <linux/errno.h>
  #include <linux/init.h>
  #include <linux/kernel.h>
8bc3bcc93   Paul Gortmaker   lib: reduce the u...
28
  #include <linux/export.h>
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
29
30
31
  #include <linux/radix-tree.h>
  #include <linux/percpu.h>
  #include <linux/slab.h>
ce80b067d   Catalin Marinas   lib/radix-tree.c:...
32
  #include <linux/kmemleak.h>
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
33
  #include <linux/cpu.h>
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
34
35
  #include <linux/string.h>
  #include <linux/bitops.h>
7cf9c2c76   Nick Piggin   [PATCH] radix-tre...
36
  #include <linux/rcupdate.h>
92cf21187   Frederic Weisbecker   sched/preempt: Me...
37
  #include <linux/preempt.h>		/* in_interrupt() */
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
38

c78c66d1d   Kirill A. Shutemov   radix-tree: imple...
39
40
  /* Number of nodes in fully populated tree of given height */
  static unsigned long height_to_maxnodes[RADIX_TREE_MAX_PATH + 1] __read_mostly;
26fb1589c   Jeff Moyer   fix the max path ...
41
  /*
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
42
43
   * Radix tree node cache.
   */
e18b890bb   Christoph Lameter   [PATCH] slab: rem...
44
  static struct kmem_cache *radix_tree_node_cachep;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
45
46
  
  /*
553680529   Nick Piggin   radix-tree: fix p...
47
48
49
50
51
52
53
54
55
56
57
58
59
   * The radix tree is variable-height, so an insert operation not only has
   * to build the branch to its corresponding item, it also has to build the
   * branch to existing items if the size has to be increased (by
   * radix_tree_extend).
   *
   * The worst case is a zero height tree with just a single item at index 0,
   * and then inserting an item at index ULONG_MAX. This requires 2 new branches
   * of RADIX_TREE_MAX_PATH size to be created, with only the root node shared.
   * Hence:
   */
  #define RADIX_TREE_PRELOAD_SIZE (RADIX_TREE_MAX_PATH * 2 - 1)
  
  /*
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
60
61
62
   * Per-cpu pool of preloaded nodes
   */
  struct radix_tree_preload {
  	/* How many nodes are currently chained on @nodes */
  	unsigned int nr;
  	/* Head of the chain; each node's private_data links to the next one */
  	struct radix_tree_node *nodes;
  };
8cef7d57a   Harvey Harrison   lib: radix_tree.c...
67
  static DEFINE_PER_CPU(struct radix_tree_preload, radix_tree_preloads) = { 0, };
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
68

148deab22   Matthew Wilcox   radix-tree: impro...
69
70
71
72
  /* Clear RADIX_TREE_INTERNAL_NODE from @ptr and return it as a node pointer. */
  static inline struct radix_tree_node *entry_to_node(void *ptr)
  {
  	unsigned long bits = (unsigned long)ptr;
  
  	bits &= ~RADIX_TREE_INTERNAL_NODE;
  	return (void *)bits;
  }
a4db4dcea   Matthew Wilcox   radix-tree: renam...
73
  static inline void *node_to_entry(void *ptr)
27d20fddc   Nick Piggin   radix-tree: fix R...
74
  {
30ff46ccb   Matthew Wilcox   radix-tree: renam...
75
  	return (void *)((unsigned long)ptr | RADIX_TREE_INTERNAL_NODE);
27d20fddc   Nick Piggin   radix-tree: fix R...
76
  }
a4db4dcea   Matthew Wilcox   radix-tree: renam...
77
  #define RADIX_TREE_RETRY	node_to_entry(NULL)
afe0e395b   Matthew Wilcox   radix-tree: fix s...
78

db050f292   Matthew Wilcox   radix-tree: add m...
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
  #ifdef CONFIG_RADIX_TREE_MULTIORDER
  /*
   * A sibling entry points at another slot of the same node, so it is
   * recognised by its address falling inside @parent's slots[] array.
   */
  static inline bool is_sibling_entry(struct radix_tree_node *parent, void *node)
  {
  	void **candidate = node;
  
  	if (candidate < parent->slots)
  		return false;
  	return candidate < parent->slots + RADIX_TREE_MAP_SIZE;
  }
  #else
  /* Without CONFIG_RADIX_TREE_MULTIORDER nothing is ever reported as a sibling. */
  static inline bool is_sibling_entry(struct radix_tree_node *parent, void *node)
  {
  	return false;
  }
  #endif
  
  /* Position of @slot within @parent's slots[] array. */
  static inline unsigned long get_slot_offset(struct radix_tree_node *parent,
  						 void **slot)
  {
  	return slot - &parent->slots[0];
  }
9e85d8111   Matthew Wilcox   radix-tree: make ...
99
100
  static unsigned int radix_tree_descend(struct radix_tree_node *parent,
  			struct radix_tree_node **nodep, unsigned long index)
db050f292   Matthew Wilcox   radix-tree: add m...
101
  {
9e85d8111   Matthew Wilcox   radix-tree: make ...
102
  	unsigned int offset = (index >> parent->shift) & RADIX_TREE_MAP_MASK;
db050f292   Matthew Wilcox   radix-tree: add m...
103
104
105
  	void **entry = rcu_dereference_raw(parent->slots[offset]);
  
  #ifdef CONFIG_RADIX_TREE_MULTIORDER
b194d16c2   Matthew Wilcox   radix-tree: renam...
106
  	if (radix_tree_is_internal_node(entry)) {
8d2c0d36d   Linus Torvalds   radix tree: fix s...
107
108
109
110
  		if (is_sibling_entry(parent, entry)) {
  			void **sibentry = (void **) entry_to_node(entry);
  			offset = get_slot_offset(parent, sibentry);
  			entry = rcu_dereference_raw(*sibentry);
db050f292   Matthew Wilcox   radix-tree: add m...
111
112
113
114
115
116
117
  		}
  	}
  #endif
  
  	*nodep = (void *)entry;
  	return offset;
  }
612d6c19d   Nick Piggin   [PATCH] radix-tre...
118
119
120
121
  /* @root's gfp_mask restricted to __GFP_BITS_MASK (the tag bits are dropped). */
  static inline gfp_t root_gfp_mask(struct radix_tree_root *root)
  {
  	gfp_t flags = root->gfp_mask;
  
  	return flags & __GFP_BITS_MASK;
  }
643b52b9c   Nick Piggin   radix-tree: fix s...
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
  /* Set bit @offset in @node's bitmap for @tag (non-atomic __set_bit). */
  static inline void tag_set(struct radix_tree_node *node, unsigned int tag,
  		int offset)
  {
  	unsigned long *bitmap = node->tags[tag];
  
  	__set_bit(offset, bitmap);
  }
  
  /* Clear bit @offset in @node's bitmap for @tag (non-atomic __clear_bit). */
  static inline void tag_clear(struct radix_tree_node *node, unsigned int tag,
  		int offset)
  {
  	unsigned long *bitmap = node->tags[tag];
  
  	__clear_bit(offset, bitmap);
  }
  
  /* Test bit @offset in @node's bitmap for @tag; non-zero when it is set. */
  static inline int tag_get(struct radix_tree_node *node, unsigned int tag,
  		int offset)
  {
  	const unsigned long *bitmap = node->tags[tag];
  
  	return test_bit(offset, bitmap);
  }
  
  static inline void root_tag_set(struct radix_tree_root *root, unsigned int tag)
  {
  	root->gfp_mask |= (__force gfp_t)(1 << (tag + __GFP_BITS_SHIFT));
  }
2fcd9005c   Matthew Wilcox   radix-tree: misce...
144
  static inline void root_tag_clear(struct radix_tree_root *root, unsigned tag)
643b52b9c   Nick Piggin   radix-tree: fix s...
145
146
147
148
149
150
151
152
153
154
155
  {
  	root->gfp_mask &= (__force gfp_t)~(1 << (tag + __GFP_BITS_SHIFT));
  }
  
  /* Drop every tag from @root, keeping only the bits inside __GFP_BITS_MASK. */
  static inline void root_tag_clear_all(struct radix_tree_root *root)
  {
  	root->gfp_mask = root_gfp_mask(root);
  }
  
  static inline int root_tag_get(struct radix_tree_root *root, unsigned int tag)
  {
2fcd9005c   Matthew Wilcox   radix-tree: misce...
156
  	return (__force int)root->gfp_mask & (1 << (tag + __GFP_BITS_SHIFT));
643b52b9c   Nick Piggin   radix-tree: fix s...
157
  }
7b60e9ad5   Matthew Wilcox   radix-tree: fix m...
158
159
160
161
  static inline unsigned root_tags_get(struct radix_tree_root *root)
  {
  	return (__force unsigned)root->gfp_mask >> __GFP_BITS_SHIFT;
  }
643b52b9c   Nick Piggin   radix-tree: fix s...
162
163
164
165
166
167
  /*
   * Returns 1 if any slot in the node has this tag set.
   * Otherwise returns 0.
   */
  static inline int any_tag_set(struct radix_tree_node *node, unsigned int tag)
  {
2fcd9005c   Matthew Wilcox   radix-tree: misce...
168
  	unsigned idx;
643b52b9c   Nick Piggin   radix-tree: fix s...
169
170
171
172
173
174
  	for (idx = 0; idx < RADIX_TREE_TAG_LONGS; idx++) {
  		if (node->tags[tag][idx])
  			return 1;
  	}
  	return 0;
  }
78c1d7848   Konstantin Khlebnikov   radix-tree: intro...
175
176
177
178
179
180
181
182
183
184
185
186
187
  
  /**
   * radix_tree_find_next_bit - find the next set tag bit in a node
   *
   * @node: The node whose tag bitmap is searched
   * @tag: The tag whose bitmap is searched
   * @offset: The bitnumber to start searching at
   *
   * Unrollable variant of find_next_bit() for constant size arrays.
   * Tail bits starting from RADIX_TREE_MAP_SIZE to
   * roundup(RADIX_TREE_MAP_SIZE, BITS_PER_LONG) must be zero.
   * Returns next bit offset, or RADIX_TREE_MAP_SIZE if nothing found.
   */
  static __always_inline unsigned long
bc412fca6   Matthew Wilcox   radix-tree: make ...
188
189
  radix_tree_find_next_bit(struct radix_tree_node *node, unsigned int tag,
  			 unsigned long offset)
78c1d7848   Konstantin Khlebnikov   radix-tree: intro...
190
  {
bc412fca6   Matthew Wilcox   radix-tree: make ...
191
  	const unsigned long *addr = node->tags[tag];
78c1d7848   Konstantin Khlebnikov   radix-tree: intro...
192

bc412fca6   Matthew Wilcox   radix-tree: make ...
193
  	if (offset < RADIX_TREE_MAP_SIZE) {
78c1d7848   Konstantin Khlebnikov   radix-tree: intro...
194
195
196
197
198
199
200
  		unsigned long tmp;
  
  		addr += offset / BITS_PER_LONG;
  		tmp = *addr >> (offset % BITS_PER_LONG);
  		if (tmp)
  			return __ffs(tmp) + offset;
  		offset = (offset + BITS_PER_LONG) & ~(BITS_PER_LONG - 1);
bc412fca6   Matthew Wilcox   radix-tree: make ...
201
  		while (offset < RADIX_TREE_MAP_SIZE) {
78c1d7848   Konstantin Khlebnikov   radix-tree: intro...
202
203
204
205
206
207
  			tmp = *++addr;
  			if (tmp)
  				return __ffs(tmp) + offset;
  			offset += BITS_PER_LONG;
  		}
  	}
bc412fca6   Matthew Wilcox   radix-tree: make ...
208
  	return RADIX_TREE_MAP_SIZE;
78c1d7848   Konstantin Khlebnikov   radix-tree: intro...
209
  }
268f42de7   Matthew Wilcox   radix-tree: delet...
210
211
212
213
  /* iter->index shifted down by iter_shift(iter) and masked to a slot offset. */
  static unsigned int iter_offset(const struct radix_tree_iter *iter)
  {
  	unsigned long shifted = iter->index >> iter_shift(iter);
  
  	return shifted & RADIX_TREE_MAP_MASK;
  }
218ed7503   Matthew Wilcox   radix-tree: impro...
214
215
216
217
218
219
220
221
222
223
224
225
  /*
   * The maximum index which can be stored below a node of the given @shift:
   * RADIX_TREE_MAP_SIZE slots, each spanning (1 << @shift) indices, less one.
   */
  static inline unsigned long shift_maxindex(unsigned int shift)
  {
  	unsigned long span = RADIX_TREE_MAP_SIZE << shift;
  
  	return span - 1;
  }
  
  /* shift_maxindex() applied to @node's own shift. */
  static inline unsigned long node_maxindex(struct radix_tree_node *node)
  {
  	unsigned int shift = node->shift;
  
  	return shift_maxindex(shift);
  }
0796c5832   Ross Zwisler   radix-tree: fix r...
226
  #ifndef __KERNEL__
d0891265b   Matthew Wilcox   radix-tree: remov...
227
  static void dump_node(struct radix_tree_node *node, unsigned long index)
7cf19af4d   Matthew Wilcox   radix_tree: add r...
228
  {
0796c5832   Ross Zwisler   radix-tree: fix r...
229
  	unsigned long i;
7cf19af4d   Matthew Wilcox   radix_tree: add r...
230

218ed7503   Matthew Wilcox   radix-tree: impro...
231
232
233
234
  	pr_debug("radix node: %p offset %d indices %lu-%lu parent %p tags %lx %lx %lx shift %d count %d exceptional %d
  ",
  		node, node->offset, index, index | node_maxindex(node),
  		node->parent,
0796c5832   Ross Zwisler   radix-tree: fix r...
235
  		node->tags[0][0], node->tags[1][0], node->tags[2][0],
218ed7503   Matthew Wilcox   radix-tree: impro...
236
  		node->shift, node->count, node->exceptional);
0796c5832   Ross Zwisler   radix-tree: fix r...
237
238
  
  	for (i = 0; i < RADIX_TREE_MAP_SIZE; i++) {
d0891265b   Matthew Wilcox   radix-tree: remov...
239
240
  		unsigned long first = index | (i << node->shift);
  		unsigned long last = first | ((1UL << node->shift) - 1);
0796c5832   Ross Zwisler   radix-tree: fix r...
241
242
243
  		void *entry = node->slots[i];
  		if (!entry)
  			continue;
218ed7503   Matthew Wilcox   radix-tree: impro...
244
245
246
247
  		if (entry == RADIX_TREE_RETRY) {
  			pr_debug("radix retry offset %ld indices %lu-%lu parent %p
  ",
  					i, first, last, node);
b194d16c2   Matthew Wilcox   radix-tree: renam...
248
  		} else if (!radix_tree_is_internal_node(entry)) {
218ed7503   Matthew Wilcox   radix-tree: impro...
249
250
251
252
253
254
255
256
  			pr_debug("radix entry %p offset %ld indices %lu-%lu parent %p
  ",
  					entry, i, first, last, node);
  		} else if (is_sibling_entry(node, entry)) {
  			pr_debug("radix sblng %p offset %ld indices %lu-%lu parent %p val %p
  ",
  					entry, i, first, last, node,
  					*(void **)entry_to_node(entry));
0796c5832   Ross Zwisler   radix-tree: fix r...
257
  		} else {
4dd6c0987   Matthew Wilcox   radix-tree: renam...
258
  			dump_node(entry_to_node(entry), first);
0796c5832   Ross Zwisler   radix-tree: fix r...
259
260
  		}
  	}
7cf19af4d   Matthew Wilcox   radix_tree: add r...
261
262
263
264
265
  }
  
  /* For debug */
  static void radix_tree_dump(struct radix_tree_root *root)
  {
d0891265b   Matthew Wilcox   radix-tree: remov...
266
267
268
  	pr_debug("radix root: %p rnode %p tags %x
  ",
  			root, root->rnode,
7cf19af4d   Matthew Wilcox   radix_tree: add r...
269
  			root->gfp_mask >> __GFP_BITS_SHIFT);
b194d16c2   Matthew Wilcox   radix-tree: renam...
270
  	if (!radix_tree_is_internal_node(root->rnode))
7cf19af4d   Matthew Wilcox   radix_tree: add r...
271
  		return;
4dd6c0987   Matthew Wilcox   radix-tree: renam...
272
  	dump_node(entry_to_node(root->rnode), 0);
7cf19af4d   Matthew Wilcox   radix_tree: add r...
273
274
  }
  #endif
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
275
276
277
278
279
  /*
   * This assumes that the caller has performed appropriate preallocation, and
   * that the caller has pinned this thread of control to the current CPU.
   */
  static struct radix_tree_node *
e8de43407   Matthew Wilcox   radix-tree: ensur...
280
281
282
283
  radix_tree_node_alloc(struct radix_tree_root *root,
  			struct radix_tree_node *parent,
  			unsigned int shift, unsigned int offset,
  			unsigned int count, unsigned int exceptional)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
284
  {
e2848a0ef   Nick Piggin   radix-tree: avoid...
285
  	struct radix_tree_node *ret = NULL;
612d6c19d   Nick Piggin   [PATCH] radix-tre...
286
  	gfp_t gfp_mask = root_gfp_mask(root);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
287

5e4c0d974   Jan Kara   lib/radix-tree.c:...
288
  	/*
2fcd9005c   Matthew Wilcox   radix-tree: misce...
289
290
291
  	 * Preload code isn't irq safe and it doesn't make sense to use
  	 * preloading during an interrupt anyway as all the allocations have
  	 * to be atomic. So just do normal allocation when in interrupt.
5e4c0d974   Jan Kara   lib/radix-tree.c:...
292
  	 */
d0164adc8   Mel Gorman   mm, page_alloc: d...
293
  	if (!gfpflags_allow_blocking(gfp_mask) && !in_interrupt()) {
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
294
  		struct radix_tree_preload *rtp;
e2848a0ef   Nick Piggin   radix-tree: avoid...
295
  		/*
58e698af4   Vladimir Davydov   radix-tree: accou...
296
  		 * Even if the caller has preloaded, try to allocate from the
05eb6e726   Vladimir Davydov   radix-tree: accou...
297
298
  		 * cache first for the new node to get accounted to the memory
  		 * cgroup.
58e698af4   Vladimir Davydov   radix-tree: accou...
299
300
  		 */
  		ret = kmem_cache_alloc(radix_tree_node_cachep,
05eb6e726   Vladimir Davydov   radix-tree: accou...
301
  				       gfp_mask | __GFP_NOWARN);
58e698af4   Vladimir Davydov   radix-tree: accou...
302
303
304
305
  		if (ret)
  			goto out;
  
  		/*
e2848a0ef   Nick Piggin   radix-tree: avoid...
306
307
308
309
  		 * Provided the caller has preloaded here, we will always
  		 * succeed in getting a node here (and never reach
  		 * kmem_cache_alloc)
  		 */
7c8e0181e   Christoph Lameter   mm: replace __get...
310
  		rtp = this_cpu_ptr(&radix_tree_preloads);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
311
  		if (rtp->nr) {
9d2a8da00   Kirill A. Shutemov   radix-tree: repla...
312
313
314
  			ret = rtp->nodes;
  			rtp->nodes = ret->private_data;
  			ret->private_data = NULL;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
315
316
  			rtp->nr--;
  		}
ce80b067d   Catalin Marinas   lib/radix-tree.c:...
317
318
319
320
321
  		/*
  		 * Update the allocation stack trace as this is more useful
  		 * for debugging.
  		 */
  		kmemleak_update_trace(ret);
58e698af4   Vladimir Davydov   radix-tree: accou...
322
  		goto out;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
323
  	}
05eb6e726   Vladimir Davydov   radix-tree: accou...
324
  	ret = kmem_cache_alloc(radix_tree_node_cachep, gfp_mask);
58e698af4   Vladimir Davydov   radix-tree: accou...
325
  out:
b194d16c2   Matthew Wilcox   radix-tree: renam...
326
  	BUG_ON(radix_tree_is_internal_node(ret));
e8de43407   Matthew Wilcox   radix-tree: ensur...
327
328
329
330
331
332
333
  	if (ret) {
  		ret->parent = parent;
  		ret->shift = shift;
  		ret->offset = offset;
  		ret->count = count;
  		ret->exceptional = exceptional;
  	}
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
334
335
  	return ret;
  }
7cf9c2c76   Nick Piggin   [PATCH] radix-tre...
336
337
338
339
  static void radix_tree_node_rcu_free(struct rcu_head *head)
  {
  	struct radix_tree_node *node =
  			container_of(head, struct radix_tree_node, rcu_head);
643b52b9c   Nick Piggin   radix-tree: fix s...
340
341
  
  	/*
175542f57   Matthew Wilcox   radix-tree: add r...
342
343
344
  	 * Must only free zeroed nodes into the slab.  We can be left with
  	 * non-NULL entries by radix_tree_free_nodes, so clear the entries
  	 * and tags here.
643b52b9c   Nick Piggin   radix-tree: fix s...
345
  	 */
175542f57   Matthew Wilcox   radix-tree: add r...
346
347
  	memset(node->slots, 0, sizeof(node->slots));
  	memset(node->tags, 0, sizeof(node->tags));
91d9c05ac   Matthew Wilcox   radix-tree: move ...
348
  	INIT_LIST_HEAD(&node->private_list);
643b52b9c   Nick Piggin   radix-tree: fix s...
349

7cf9c2c76   Nick Piggin   [PATCH] radix-tre...
350
351
  	kmem_cache_free(radix_tree_node_cachep, node);
  }
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
352
353
354
  static inline void
  radix_tree_node_free(struct radix_tree_node *node)
  {
7cf9c2c76   Nick Piggin   [PATCH] radix-tre...
355
  	call_rcu(&node->rcu_head, radix_tree_node_rcu_free);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
356
357
358
359
360
361
362
  }
  
  /*
   * Load up this CPU's radix_tree_node buffer with sufficient objects to
   * ensure that the addition of a single element in the tree cannot fail.  On
   * success, return zero, with preemption disabled.  On error, return -ENOMEM
   * with preemption not disabled.
b34df792b   David Howells   FS-Cache: Use rad...
363
364
   *
   * To make use of this facility, the radix tree must be initialised without
d0164adc8   Mel Gorman   mm, page_alloc: d...
365
   * __GFP_DIRECT_RECLAIM being passed to INIT_RADIX_TREE().
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
366
   */
2791653a6   Matthew Wilcox   radix-tree: add r...
367
  static int __radix_tree_preload(gfp_t gfp_mask, unsigned nr)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
368
369
370
371
  {
  	struct radix_tree_preload *rtp;
  	struct radix_tree_node *node;
  	int ret = -ENOMEM;
05eb6e726   Vladimir Davydov   radix-tree: accou...
372
373
374
375
376
  	/*
  	 * Nodes preloaded by one cgroup can be be used by another cgroup, so
  	 * they should never be accounted to any particular memory cgroup.
  	 */
  	gfp_mask &= ~__GFP_ACCOUNT;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
377
  	preempt_disable();
7c8e0181e   Christoph Lameter   mm: replace __get...
378
  	rtp = this_cpu_ptr(&radix_tree_preloads);
c78c66d1d   Kirill A. Shutemov   radix-tree: imple...
379
  	while (rtp->nr < nr) {
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
380
  		preempt_enable();
488514d17   Christoph Lameter   Remove set_migrat...
381
  		node = kmem_cache_alloc(radix_tree_node_cachep, gfp_mask);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
382
383
384
  		if (node == NULL)
  			goto out;
  		preempt_disable();
7c8e0181e   Christoph Lameter   mm: replace __get...
385
  		rtp = this_cpu_ptr(&radix_tree_preloads);
c78c66d1d   Kirill A. Shutemov   radix-tree: imple...
386
  		if (rtp->nr < nr) {
9d2a8da00   Kirill A. Shutemov   radix-tree: repla...
387
388
389
390
  			node->private_data = rtp->nodes;
  			rtp->nodes = node;
  			rtp->nr++;
  		} else {
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
391
  			kmem_cache_free(radix_tree_node_cachep, node);
9d2a8da00   Kirill A. Shutemov   radix-tree: repla...
392
  		}
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
393
394
395
396
397
  	}
  	ret = 0;
  out:
  	return ret;
  }
5e4c0d974   Jan Kara   lib/radix-tree.c:...
398
399
400
401
402
403
404
405
  
  /*
   * Load up this CPU's radix_tree_node buffer with RADIX_TREE_PRELOAD_SIZE
   * nodes, enough to ensure that the addition of a single element in the
   * tree cannot fail.  On success, return zero, with preemption disabled.
   * On error, return -ENOMEM with preemption not disabled.
   *
   * To make use of this facility, the radix tree must be initialised without
   * __GFP_DIRECT_RECLAIM being passed to INIT_RADIX_TREE().
   */
  int radix_tree_preload(gfp_t gfp_mask)
  {
  	bool may_block = gfpflags_allow_blocking(gfp_mask);
  
  	/* Warn on non-sensical use... */
  	WARN_ON_ONCE(!may_block);
  	return __radix_tree_preload(gfp_mask, RADIX_TREE_PRELOAD_SIZE);
  }
d7f0923d8   David Chinner   [LIB]: export rad...
414
  EXPORT_SYMBOL(radix_tree_preload);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
415

6e954b9e9   Nick Piggin   [PATCH] radix tre...
416
  /*
   * Like radix_tree_preload(), except that preloading is not guaranteed to
   * happen: it is only done when @gfp_mask allows blocking. On success,
   * return zero with preemption disabled. On error, return -ENOMEM with
   * preemption not disabled.
   */
  int radix_tree_maybe_preload(gfp_t gfp_mask)
  {
  	if (!gfpflags_allow_blocking(gfp_mask)) {
  		/* Preloading doesn't help anything with this gfp mask, skip it */
  		preempt_disable();
  		return 0;
  	}
  	return __radix_tree_preload(gfp_mask, RADIX_TREE_PRELOAD_SIZE);
  }
  EXPORT_SYMBOL(radix_tree_maybe_preload);
2791653a6   Matthew Wilcox   radix-tree: add r...
430
431
432
433
434
435
436
437
438
439
440
441
442
443
444
445
446
447
448
449
450
  #ifdef CONFIG_RADIX_TREE_MULTIORDER
  /*
   * Preload with enough objects to ensure that we can split a single entry
   * of order @old_order into many entries of size @new_order.
   *
   * @new_order must be smaller than @old_order.  Returns whatever
   * __radix_tree_preload() returns for the computed node count.
   */
  int radix_tree_split_preload(unsigned int old_order, unsigned int new_order,
  							gfp_t gfp_mask)
  {
  	unsigned top, layers;
  	unsigned nr = 0;
  
  	WARN_ON_ONCE(!gfpflags_allow_blocking(gfp_mask));
  	BUG_ON(new_order >= old_order);
  
  	/* Slots of the topmost node that the old entry occupies */
  	top = 1 << (old_order % RADIX_TREE_MAP_SHIFT);
  	/* Tree levels separating the old order from the new one */
  	layers = (old_order / RADIX_TREE_MAP_SHIFT) -
  				(new_order / RADIX_TREE_MAP_SHIFT);
  
  	/* Each further layer multiplies the node count and adds one. */
  	for (; layers; layers--)
  		nr = nr * RADIX_TREE_MAP_SIZE + 1;
  
  	return __radix_tree_preload(gfp_mask, top * nr);
  }
  #endif
5e4c0d974   Jan Kara   lib/radix-tree.c:...
451
  /*
   * Like radix_tree_maybe_preload(), but preload the number of nodes required
   * to insert (1 << order) continuous naturally-aligned elements.
   *
   * When @gfp_mask does not allow blocking nothing is preloaded and zero is
   * returned with preemption disabled; otherwise the result is that of
   * __radix_tree_preload() for the computed node count.
   */
  int radix_tree_maybe_preload_order(gfp_t gfp_mask, int order)
  {
  	unsigned long nr_subtrees;
  	int nr_nodes, subtree_height;
  
  	/* Preloading doesn't help anything with this gfp mask, skip it */
  	if (!gfpflags_allow_blocking(gfp_mask)) {
  		preempt_disable();
  		return 0;
  	}
  
  	/*
  	 * Calculate number and height of fully populated subtrees it takes to
  	 * store (1 << order) elements.
  	 *
  	 * The shift is done in unsigned long, matching nr_subtrees: a plain
  	 * int "1 << order" is undefined once order reaches the width of int.
  	 */
  	nr_subtrees = 1UL << order;
  	for (subtree_height = 0; nr_subtrees > RADIX_TREE_MAP_SIZE;
  			subtree_height++)
  		nr_subtrees >>= RADIX_TREE_MAP_SHIFT;
  
  	/*
  	 * The worst case is zero height tree with a single item at index 0 and
  	 * then inserting items starting at ULONG_MAX - (1 << order).
  	 *
  	 * This requires RADIX_TREE_MAX_PATH nodes to build branch from root to
  	 * 0-index item.
  	 */
  	nr_nodes = RADIX_TREE_MAX_PATH;
  
  	/* Plus branch to fully populated subtrees. */
  	nr_nodes += RADIX_TREE_MAX_PATH - subtree_height;
  
  	/* Root node is shared. */
  	nr_nodes--;
  
  	/* Plus nodes required to build subtrees. */
  	nr_nodes += nr_subtrees * height_to_maxnodes[subtree_height];
  
  	return __radix_tree_preload(gfp_mask, nr_nodes);
  }
1456a439f   Matthew Wilcox   radix-tree: intro...
495
496
497
498
499
500
  static unsigned radix_tree_load_root(struct radix_tree_root *root,
  		struct radix_tree_node **nodep, unsigned long *maxindex)
  {
  	struct radix_tree_node *node = rcu_dereference_raw(root->rnode);
  
  	*nodep = node;
b194d16c2   Matthew Wilcox   radix-tree: renam...
501
  	if (likely(radix_tree_is_internal_node(node))) {
4dd6c0987   Matthew Wilcox   radix-tree: renam...
502
  		node = entry_to_node(node);
1456a439f   Matthew Wilcox   radix-tree: intro...
503
  		*maxindex = node_maxindex(node);
c12e51b07   Matthew Wilcox   radix-tree: repla...
504
  		return node->shift + RADIX_TREE_MAP_SHIFT;
1456a439f   Matthew Wilcox   radix-tree: intro...
505
506
507
508
509
  	}
  
  	*maxindex = 0;
  	return 0;
  }
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
510
511
512
  /*
   *	Extend a radix tree so it can store key @index.
   */
e61452365   Matthew Wilcox   radix_tree: add s...
513
  static int radix_tree_extend(struct radix_tree_root *root,
d0891265b   Matthew Wilcox   radix-tree: remov...
514
  				unsigned long index, unsigned int shift)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
515
  {
e2bdb933a   Hugh Dickins   radix_tree: take ...
516
  	struct radix_tree_node *slot;
d0891265b   Matthew Wilcox   radix-tree: remov...
517
  	unsigned int maxshift;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
518
  	int tag;
d0891265b   Matthew Wilcox   radix-tree: remov...
519
520
521
522
  	/* Figure out what the shift should be.  */
  	maxshift = shift;
  	while (index > shift_maxindex(maxshift))
  		maxshift += RADIX_TREE_MAP_SHIFT;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
523

d0891265b   Matthew Wilcox   radix-tree: remov...
524
525
  	slot = root->rnode;
  	if (!slot)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
526
  		goto out;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
527

1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
528
  	do {
e8de43407   Matthew Wilcox   radix-tree: ensur...
529
530
  		struct radix_tree_node *node = radix_tree_node_alloc(root,
  							NULL, shift, 0, 1, 0);
2fcd9005c   Matthew Wilcox   radix-tree: misce...
531
  		if (!node)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
532
  			return -ENOMEM;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
533
  		/* Propagate the aggregated tag info into the new root */
daff89f32   Jonathan Corbet   [PATCH] radix-tre...
534
  		for (tag = 0; tag < RADIX_TREE_MAX_TAGS; tag++) {
612d6c19d   Nick Piggin   [PATCH] radix-tre...
535
  			if (root_tag_get(root, tag))
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
536
537
  				tag_set(node, tag, 0);
  		}
d0891265b   Matthew Wilcox   radix-tree: remov...
538
  		BUG_ON(shift > BITS_PER_LONG);
f7942430e   Johannes Weiner   lib: radix-tree: ...
539
  		if (radix_tree_is_internal_node(slot)) {
4dd6c0987   Matthew Wilcox   radix-tree: renam...
540
  			entry_to_node(slot)->parent = node;
e8de43407   Matthew Wilcox   radix-tree: ensur...
541
  		} else if (radix_tree_exceptional_entry(slot)) {
f7942430e   Johannes Weiner   lib: radix-tree: ...
542
  			/* Moving an exceptional root->rnode to a node */
e8de43407   Matthew Wilcox   radix-tree: ensur...
543
  			node->exceptional = 1;
f7942430e   Johannes Weiner   lib: radix-tree: ...
544
  		}
e2bdb933a   Hugh Dickins   radix_tree: take ...
545
  		node->slots[0] = slot;
a4db4dcea   Matthew Wilcox   radix-tree: renam...
546
547
  		slot = node_to_entry(node);
  		rcu_assign_pointer(root->rnode, slot);
d0891265b   Matthew Wilcox   radix-tree: remov...
548
  		shift += RADIX_TREE_MAP_SHIFT;
d0891265b   Matthew Wilcox   radix-tree: remov...
549
  	} while (shift <= maxshift);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
550
  out:
d0891265b   Matthew Wilcox   radix-tree: remov...
551
  	return maxshift + RADIX_TREE_MAP_SHIFT;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
552
553
554
  }
  
  /**
f4b109c6d   Johannes Weiner   lib: radix-tree: ...
555
556
557
   *	radix_tree_shrink    -    shrink radix tree to minimum height
   *	@root		radix tree root
   */
14b468791   Johannes Weiner   mm: workingset: m...
558
  static inline void radix_tree_shrink(struct radix_tree_root *root,
4d693d086   Johannes Weiner   lib: radix-tree: ...
559
560
  				     radix_tree_update_node_t update_node,
  				     void *private)
f4b109c6d   Johannes Weiner   lib: radix-tree: ...
561
  {
f4b109c6d   Johannes Weiner   lib: radix-tree: ...
562
563
564
565
566
567
568
569
570
571
572
573
574
575
576
577
578
579
580
581
582
583
584
585
586
587
588
589
590
591
592
593
594
595
596
597
598
599
600
601
602
603
604
605
606
607
608
609
610
611
612
  	for (;;) {
  		struct radix_tree_node *node = root->rnode;
  		struct radix_tree_node *child;
  
  		if (!radix_tree_is_internal_node(node))
  			break;
  		node = entry_to_node(node);
  
  		/*
  		 * The candidate node has more than one child, or its child
  		 * is not at the leftmost slot, or the child is a multiorder
  		 * entry, we cannot shrink.
  		 */
  		if (node->count != 1)
  			break;
  		child = node->slots[0];
  		if (!child)
  			break;
  		if (!radix_tree_is_internal_node(child) && node->shift)
  			break;
  
  		if (radix_tree_is_internal_node(child))
  			entry_to_node(child)->parent = NULL;
  
  		/*
  		 * We don't need rcu_assign_pointer(), since we are simply
  		 * moving the node from one part of the tree to another: if it
  		 * was safe to dereference the old pointer to it
  		 * (node->slots[0]), it will be safe to dereference the new
  		 * one (root->rnode) as far as dependent read barriers go.
  		 */
  		root->rnode = child;
  
  		/*
  		 * We have a dilemma here. The node's slot[0] must not be
  		 * NULLed in case there are concurrent lookups expecting to
  		 * find the item. However if this was a bottom-level node,
  		 * then it may be subject to the slot pointer being visible
  		 * to callers dereferencing it. If item corresponding to
  		 * slot[0] is subsequently deleted, these callers would expect
  		 * their slot to become empty sooner or later.
  		 *
  		 * For example, lockless pagecache will look up a slot, deref
  		 * the page pointer, and if the page has 0 refcount it means it
  		 * was concurrently deleted from pagecache so try the deref
  		 * again. Fortunately there is already a requirement for logic
  		 * to retry the entire slot lookup -- the indirect pointer
  		 * problem (replacing direct root node with an indirect pointer
  		 * also results in a stale slot). So tag the slot as indirect
  		 * to force callers to retry.
  		 */
4d693d086   Johannes Weiner   lib: radix-tree: ...
613
614
  		node->count = 0;
  		if (!radix_tree_is_internal_node(child)) {
f4b109c6d   Johannes Weiner   lib: radix-tree: ...
615
  			node->slots[0] = RADIX_TREE_RETRY;
4d693d086   Johannes Weiner   lib: radix-tree: ...
616
617
618
  			if (update_node)
  				update_node(node, private);
  		}
f4b109c6d   Johannes Weiner   lib: radix-tree: ...
619
620
  
  		radix_tree_node_free(node);
f4b109c6d   Johannes Weiner   lib: radix-tree: ...
621
  	}
f4b109c6d   Johannes Weiner   lib: radix-tree: ...
622
  }
14b468791   Johannes Weiner   mm: workingset: m...
623
  /*
   * Release @node if it no longer holds any entries, then do the same for
   * every ancestor that becomes empty as a result.  An emptied node is
   * unhooked from its parent's slot before it is freed; when the emptied
   * node has no parent, all root tags are cleared and root->rnode is reset
   * to NULL instead.  The walk stops at the first node that still has
   * entries, and if that node is the one root->rnode refers to,
   * radix_tree_shrink() is invoked with @update_node and @private.
   */
  static void delete_node(struct radix_tree_root *root,
  			struct radix_tree_node *node,
  			radix_tree_update_node_t update_node, void *private)
  {
  	while (!node->count) {
  		struct radix_tree_node *up = node->parent;
  
  		if (!up) {
  			root_tag_clear_all(root);
  			root->rnode = NULL;
  		} else {
  			up->slots[node->offset] = NULL;
  			up->count--;
  		}
  
  		radix_tree_node_free(node);
  
  		/* The topmost node is gone: the tree is empty now. */
  		if (!up)
  			return;
  		node = up;
  	}
  
  	if (node == entry_to_node(root->rnode))
  		radix_tree_shrink(root, update_node, private);
  }
  
  /**
139e56166   Johannes Weiner   lib: radix_tree: ...
652
   *	__radix_tree_create	-	create a slot in a radix tree
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
653
654
   *	@root:		radix tree root
   *	@index:		index key
e61452365   Matthew Wilcox   radix_tree: add s...
655
   *	@order:		index occupies 2^order aligned slots
139e56166   Johannes Weiner   lib: radix_tree: ...
656
657
   *	@nodep:		returns node
   *	@slotp:		returns slot
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
658
   *
139e56166   Johannes Weiner   lib: radix_tree: ...
659
660
661
662
663
664
665
666
   *	Create, if necessary, and return the node and slot for an item
   *	at position @index in the radix tree @root.
   *
   *	Until there is more than one item in the tree, no nodes are
   *	allocated and @root->rnode is used as a direct slot instead of
   *	pointing to a node, in which case *@nodep will be NULL.
   *
   *	Returns -ENOMEM, or 0 for success.
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
667
   */
139e56166   Johannes Weiner   lib: radix_tree: ...
668
  int __radix_tree_create(struct radix_tree_root *root, unsigned long index,
e61452365   Matthew Wilcox   radix_tree: add s...
669
670
  			unsigned order, struct radix_tree_node **nodep,
  			void ***slotp)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
671
  {
89148aa40   Matthew Wilcox   radix-tree: tidy ...
672
673
  	struct radix_tree_node *node = NULL, *child;
  	void **slot = (void **)&root->rnode;
49ea6ebcd   Matthew Wilcox   radix-tree: fix e...
674
  	unsigned long maxindex;
89148aa40   Matthew Wilcox   radix-tree: tidy ...
675
  	unsigned int shift, offset = 0;
49ea6ebcd   Matthew Wilcox   radix-tree: fix e...
676
  	unsigned long max = index | ((1UL << order) - 1);
89148aa40   Matthew Wilcox   radix-tree: tidy ...
677
  	shift = radix_tree_load_root(root, &child, &maxindex);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
678
679
  
  	/* Make sure the tree is high enough.  */
175542f57   Matthew Wilcox   radix-tree: add r...
680
681
  	if (order > 0 && max == ((1UL << order) - 1))
  		max++;
49ea6ebcd   Matthew Wilcox   radix-tree: fix e...
682
  	if (max > maxindex) {
d0891265b   Matthew Wilcox   radix-tree: remov...
683
  		int error = radix_tree_extend(root, max, shift);
49ea6ebcd   Matthew Wilcox   radix-tree: fix e...
684
  		if (error < 0)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
685
  			return error;
49ea6ebcd   Matthew Wilcox   radix-tree: fix e...
686
  		shift = error;
89148aa40   Matthew Wilcox   radix-tree: tidy ...
687
  		child = root->rnode;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
688
  	}
e61452365   Matthew Wilcox   radix_tree: add s...
689
  	while (shift > order) {
c12e51b07   Matthew Wilcox   radix-tree: repla...
690
  		shift -= RADIX_TREE_MAP_SHIFT;
89148aa40   Matthew Wilcox   radix-tree: tidy ...
691
  		if (child == NULL) {
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
692
  			/* Have to add a child node.  */
e8de43407   Matthew Wilcox   radix-tree: ensur...
693
694
  			child = radix_tree_node_alloc(root, node, shift,
  							offset, 0, 0);
89148aa40   Matthew Wilcox   radix-tree: tidy ...
695
  			if (!child)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
696
  				return -ENOMEM;
89148aa40   Matthew Wilcox   radix-tree: tidy ...
697
698
  			rcu_assign_pointer(*slot, node_to_entry(child));
  			if (node)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
699
  				node->count++;
89148aa40   Matthew Wilcox   radix-tree: tidy ...
700
  		} else if (!radix_tree_is_internal_node(child))
e61452365   Matthew Wilcox   radix_tree: add s...
701
  			break;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
702
703
  
  		/* Go a level down */
89148aa40   Matthew Wilcox   radix-tree: tidy ...
704
  		node = entry_to_node(child);
9e85d8111   Matthew Wilcox   radix-tree: make ...
705
  		offset = radix_tree_descend(node, &child, index);
89148aa40   Matthew Wilcox   radix-tree: tidy ...
706
  		slot = &node->slots[offset];
e61452365   Matthew Wilcox   radix_tree: add s...
707
  	}
175542f57   Matthew Wilcox   radix-tree: add r...
708
709
710
711
712
713
  	if (nodep)
  		*nodep = node;
  	if (slotp)
  		*slotp = slot;
  	return 0;
  }
57578c2ea   Matthew Wilcox   raxix-tree: intro...
714
  #ifdef CONFIG_RADIX_TREE_MULTIORDER
175542f57   Matthew Wilcox   radix-tree: add r...
715
716
717
718
719
720
721
722
723
724
725
726
727
728
729
730
731
732
733
734
735
736
737
738
739
740
741
742
743
744
745
746
747
748
749
750
751
752
753
754
755
  /*
   * Free @node and every node below it.  The tree is presumed to not need
   * shrinking afterwards, and user data stored in the subtree is presumed
   * to not need a destructor; that could be added later if required.
   * Tags and slots are deliberately left untouched because an RCU walker
   * may still hold a pointer into this subtree.  The entries could be
   * replaced with RADIX_TREE_RETRY, but those would still have to be
   * cleared in rcu_free.
   *
   * The walk is iterative: descend into the first child node found, and
   * once a node's last slot has been visited, free that node and resume
   * in its parent at the slot following it.
   */
  static void radix_tree_free_nodes(struct radix_tree_node *node)
  {
  	struct radix_tree_node *top = entry_to_node(node);
  	struct radix_tree_node *cur = top;
  	unsigned pos = 0;
  
  	while (1) {
  		void *entry = cur->slots[pos];
  
  		if (radix_tree_is_internal_node(entry) &&
  					!is_sibling_entry(cur, entry)) {
  			/* A real child node: visit it first. */
  			cur = entry_to_node(entry);
  			pos = 0;
  			continue;
  		}
  
  		for (pos++; pos == RADIX_TREE_MAP_SIZE; ) {
  			struct radix_tree_node *done = cur;
  
  			/* Read the way back up before the node is freed. */
  			pos = done->offset + 1;
  			cur = done->parent;
  			radix_tree_node_free(done);
  			if (done == top)
  				return;
  		}
  	}
  }
  
  /*
   * Store @item in the slot(s) covered by an entry of @order at @slot.
   *
   * When @order is larger than @node->shift the entry spans
   * n = 2^(@order - @node->shift) slots.  The first slot of that aligned
   * group receives @item and each remaining slot receives a sibling entry
   * that points back at the first slot.
   *
   * If @replace is false, finding any of those slots occupied fails the
   * call with -EEXIST before anything is modified.  If @replace is true,
   * occupied slots are overwritten: tags found on any of them end up set
   * on the first slot and cleared on the others, and any subtree that was
   * hanging off a replaced slot is freed with radix_tree_free_nodes().
   *
   * @node is NULL when @slot does not live inside a node
   * (__radix_tree_create() reports the root slot that way).  Exactly one
   * slot is written in that case and no per-node counters or tags exist
   * to be adjusted, so all node accounting is skipped; previously the
   * replace path dereferenced the NULL @node.
   *
   * Returns the number of slots written, or -EEXIST.
   */
  static inline int insert_entries(struct radix_tree_node *node, void **slot,
  				void *item, unsigned order, bool replace)
  {
  	struct radix_tree_node *child;
  	unsigned i, n, tag, offset, tags = 0;
  
  	if (node) {
  		if (order > node->shift)
  			n = 1 << (order - node->shift);
  		else
  			n = 1;
  		offset = get_slot_offset(node, slot);
  	} else {
  		n = 1;
  		offset = 0;
  	}
  
  	if (n > 1) {
  		/* n > 1 implies node != NULL; align to the group start. */
  		offset = offset & ~(n - 1);
  		slot = &node->slots[offset];
  	}
  	child = node_to_entry(slot);
  
  	for (i = 0; i < n; i++) {
  		if (!slot[i])
  			continue;
  		if (!replace)
  			return -EEXIST;
  		/* Without a node there is no count or tag to account for. */
  		if (!node)
  			continue;
  		node->count--;
  		for (tag = 0; tag < RADIX_TREE_MAX_TAGS; tag++)
  			if (tag_get(node, tag, offset + i))
  				tags |= 1 << tag;
  	}
  
  	for (i = 0; i < n; i++) {
  		struct radix_tree_node *old = slot[i];
  
  		/*
  		 * 'tags' can only be non-zero when node is non-NULL, so the
  		 * tag updates below never touch a NULL node.
  		 */
  		if (i) {
  			rcu_assign_pointer(slot[i], child);
  			for (tag = 0; tag < RADIX_TREE_MAX_TAGS; tag++)
  				if (tags & (1 << tag))
  					tag_clear(node, tag, offset + i);
  		} else {
  			rcu_assign_pointer(slot[i], item);
  			for (tag = 0; tag < RADIX_TREE_MAX_TAGS; tag++)
  				if (tags & (1 << tag))
  					tag_set(node, tag, offset);
  		}
  		if (radix_tree_is_internal_node(old) &&
  					!is_sibling_entry(node, old) &&
  					(old != RADIX_TREE_RETRY))
  			radix_tree_free_nodes(old);
  		if (node && radix_tree_exceptional_entry(old))
  			node->exceptional--;
  	}
  	if (node) {
  		node->count += n;
  		if (radix_tree_exceptional_entry(item))
  			node->exceptional += n;
  	}
  	return n;
  }
175542f57   Matthew Wilcox   radix-tree: add r...
811
812
813
814
815
816
817
818
819
820
821
822
823
824
825
  #else
  /*
   * Variant used when multiorder support is compiled out: store @item in
   * the single slot @slot.  @order and @replace are accepted only to keep
   * the signature identical to the multiorder variant and are not used.
   *
   * Returns 1 (the number of slots written), or -EEXIST if the slot is
   * already occupied.  @node may be NULL, in which case no counters are
   * updated.
   */
  static inline int insert_entries(struct radix_tree_node *node, void **slot,
  				void *item, unsigned order, bool replace)
  {
  	if (*slot != NULL)
  		return -EEXIST;
  
  	rcu_assign_pointer(*slot, item);
  	if (!node)
  		return 1;
  
  	node->count++;
  	if (radix_tree_exceptional_entry(item))
  		node->exceptional++;
  	return 1;
  }
  #endif
139e56166   Johannes Weiner   lib: radix_tree: ...
826
827
  
  /**
e61452365   Matthew Wilcox   radix_tree: add s...
828
   *	__radix_tree_insert    -    insert into a radix tree
139e56166   Johannes Weiner   lib: radix_tree: ...
829
830
   *	@root:		radix tree root
   *	@index:		index key
e61452365   Matthew Wilcox   radix_tree: add s...
831
   *	@order:		key covers the 2^order indices around index
139e56166   Johannes Weiner   lib: radix_tree: ...
832
833
834
835
   *	@item:		item to insert
   *
   *	Insert an item into the radix tree at position @index.
   */
e61452365   Matthew Wilcox   radix_tree: add s...
836
837
  int __radix_tree_insert(struct radix_tree_root *root, unsigned long index,
  			unsigned order, void *item)
139e56166   Johannes Weiner   lib: radix_tree: ...
838
839
840
841
  {
  	struct radix_tree_node *node;
  	void **slot;
  	int error;
b194d16c2   Matthew Wilcox   radix-tree: renam...
842
  	BUG_ON(radix_tree_is_internal_node(item));
139e56166   Johannes Weiner   lib: radix_tree: ...
843

e61452365   Matthew Wilcox   radix_tree: add s...
844
  	error = __radix_tree_create(root, index, order, &node, &slot);
139e56166   Johannes Weiner   lib: radix_tree: ...
845
846
  	if (error)
  		return error;
175542f57   Matthew Wilcox   radix-tree: add r...
847
848
849
850
  
  	error = insert_entries(node, slot, item, order, false);
  	if (error < 0)
  		return error;
201b6264f   Christoph Lameter   [PATCH] radix-tre...
851

612d6c19d   Nick Piggin   [PATCH] radix-tre...
852
  	if (node) {
7b60e9ad5   Matthew Wilcox   radix-tree: fix m...
853
  		unsigned offset = get_slot_offset(node, slot);
7b60e9ad5   Matthew Wilcox   radix-tree: fix m...
854
855
856
  		BUG_ON(tag_get(node, 0, offset));
  		BUG_ON(tag_get(node, 1, offset));
  		BUG_ON(tag_get(node, 2, offset));
612d6c19d   Nick Piggin   [PATCH] radix-tre...
857
  	} else {
7b60e9ad5   Matthew Wilcox   radix-tree: fix m...
858
  		BUG_ON(root_tags_get(root));
612d6c19d   Nick Piggin   [PATCH] radix-tre...
859
  	}
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
860

1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
861
862
  	return 0;
  }
e61452365   Matthew Wilcox   radix_tree: add s...
863
  EXPORT_SYMBOL(__radix_tree_insert);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
864

139e56166   Johannes Weiner   lib: radix_tree: ...
865
866
867
868
869
870
871
872
873
874
875
876
877
  /**
   *	__radix_tree_lookup	-	lookup an item in a radix tree
   *	@root:		radix tree root
   *	@index:		index key
   *	@nodep:		returns node
   *	@slotp:		returns slot
   *
   *	Lookup and return the item at position @index in the radix
   *	tree @root.
   *
   *	Until there is more than one item in the tree, no nodes are
   *	allocated and @root->rnode is used as a direct slot instead of
   *	pointing to a node, in which case *@nodep will be NULL.
7cf9c2c76   Nick Piggin   [PATCH] radix-tre...
878
   */
139e56166   Johannes Weiner   lib: radix_tree: ...
879
880
  void *__radix_tree_lookup(struct radix_tree_root *root, unsigned long index,
  			  struct radix_tree_node **nodep, void ***slotp)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
881
  {
139e56166   Johannes Weiner   lib: radix_tree: ...
882
  	struct radix_tree_node *node, *parent;
858299544   Matthew Wilcox   radix-tree: rewri...
883
  	unsigned long maxindex;
139e56166   Johannes Weiner   lib: radix_tree: ...
884
  	void **slot;
612d6c19d   Nick Piggin   [PATCH] radix-tre...
885

858299544   Matthew Wilcox   radix-tree: rewri...
886
887
888
   restart:
  	parent = NULL;
  	slot = (void **)&root->rnode;
9e85d8111   Matthew Wilcox   radix-tree: make ...
889
  	radix_tree_load_root(root, &node, &maxindex);
858299544   Matthew Wilcox   radix-tree: rewri...
890
  	if (index > maxindex)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
891
  		return NULL;
b194d16c2   Matthew Wilcox   radix-tree: renam...
892
  	while (radix_tree_is_internal_node(node)) {
858299544   Matthew Wilcox   radix-tree: rewri...
893
  		unsigned offset;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
894

858299544   Matthew Wilcox   radix-tree: rewri...
895
896
  		if (node == RADIX_TREE_RETRY)
  			goto restart;
4dd6c0987   Matthew Wilcox   radix-tree: renam...
897
  		parent = entry_to_node(node);
9e85d8111   Matthew Wilcox   radix-tree: make ...
898
  		offset = radix_tree_descend(parent, &node, index);
858299544   Matthew Wilcox   radix-tree: rewri...
899
900
  		slot = parent->slots + offset;
  	}
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
901

139e56166   Johannes Weiner   lib: radix_tree: ...
902
903
904
905
906
  	if (nodep)
  		*nodep = parent;
  	if (slotp)
  		*slotp = slot;
  	return node;
b72b71c6c   Huang Shijie   lib: do code opti...
907
908
909
910
911
912
913
914
915
916
917
918
919
920
921
922
923
  }
  
  /**
   *	radix_tree_lookup_slot    -    lookup a slot in a radix tree
   *	@root:		radix tree root
   *	@index:		index key
   *
   *	Returns:  the slot corresponding to the position @index in the
   *	radix tree @root, or NULL if no item is stored there.  This is
   *	useful for update-if-exists operations.
   *
   *	This function can be called under rcu_read_lock iff the slot is not
   *	modified by radix_tree_replace_slot, otherwise it must be called
   *	exclusive from other writers. Any dereference of the slot must be done
   *	using radix_tree_deref_slot.
   */
  void **radix_tree_lookup_slot(struct radix_tree_root *root, unsigned long index)
  {
  	void **slot;
  	void *entry = __radix_tree_lookup(root, index, NULL, &slot);
  
  	/* 'slot' is only meaningful when an item was actually found. */
  	return entry ? slot : NULL;
  }
a43313668   Hans Reiser   [PATCH] reiser4: ...
930
931
932
933
934
935
936
937
  EXPORT_SYMBOL(radix_tree_lookup_slot);
  
  /**
   *	radix_tree_lookup    -    perform lookup operation on a radix tree
   *	@root:		radix tree root
   *	@index:		index key
   *
   *	Lookup the item at the position @index in the radix tree @root.
7cf9c2c76   Nick Piggin   [PATCH] radix-tre...
938
939
940
941
942
   *
   *	This function can be called under rcu_read_lock, however the caller
   *	must manage lifetimes of leaf nodes (eg. RCU may also be used to free
   *	them safely). No RCU barriers are required to access or modify the
   *	returned item, however.
a43313668   Hans Reiser   [PATCH] reiser4: ...
943
944
945
   */
  void *radix_tree_lookup(struct radix_tree_root *root, unsigned long index)
  {
139e56166   Johannes Weiner   lib: radix_tree: ...
946
  	return __radix_tree_lookup(root, index, NULL, NULL);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
947
948
  }
  EXPORT_SYMBOL(radix_tree_lookup);
a90eb3a2a   Matthew Wilcox   radix-tree: fix r...
949
950
951
952
953
954
955
956
957
958
959
960
961
962
963
964
965
  /*
   * Count the slots in @node that belong to the entry at @slot: the slot
   * itself plus, with CONFIG_RADIX_TREE_MULTIORDER, every directly
   * following slot that holds a sibling entry pointing back at @slot.
   * Without multiorder support the answer is always 1.
   */
  static inline int slot_count(struct radix_tree_node *node,
  						void **slot)
  {
  	int total = 1;
  #ifdef CONFIG_RADIX_TREE_MULTIORDER
  	void *sibling = node_to_entry(slot);
  	unsigned pos = get_slot_offset(node, slot) + 1;
  
  	while (pos < RADIX_TREE_MAP_SIZE && node->slots[pos] == sibling) {
  		total++;
  		pos++;
  	}
  #endif
  	return total;
  }
6d75f366b   Johannes Weiner   lib: radix-tree: ...
966
967
968
969
  /*
   * Publish @item in @slot and, when @node is given, adjust the node's
   * entry accounting for the change: node->count by the difference in
   * "slot is non-NULL", node->exceptional by the difference in "entry is
   * exceptional" multiplied by the number of slots the entry occupies
   * (see slot_count()).
   *
   * Warns once if @item looks like an internal node, and once if
   * @warn_typeswitch is set while the replacement changes either of the
   * two properties above.
   */
  static void replace_slot(struct radix_tree_root *root,
  			 struct radix_tree_node *node,
  			 void **slot, void *item,
  			 bool warn_typeswitch)
  {
  	void *prev = rcu_dereference_raw(*slot);
  	int count_delta, exc_delta;
  
  	WARN_ON_ONCE(radix_tree_is_internal_node(item));
  
  	count_delta = !!item - !!prev;
  	exc_delta = !!radix_tree_exceptional_entry(item) -
  		    !!radix_tree_exceptional_entry(prev);
  
  	WARN_ON_ONCE(warn_typeswitch && (count_delta || exc_delta));
  
  	if (node) {
  		node->count += count_delta;
  		if (exc_delta)
  			node->exceptional += exc_delta * slot_count(node, slot);
  	}
  
  	/* Accounting is updated first; the new item is published last. */
  	rcu_assign_pointer(*slot, item);
  }
a90eb3a2a   Matthew Wilcox   radix-tree: fix r...
991
992
993
994
995
996
997
998
999
1000
1001
1002
1003
1004
1005
1006
1007
1008
1009
  /*
   * With CONFIG_RADIX_TREE_MULTIORDER, clear every sibling slot that
   * directly follows @slot in @node and points back at it, dropping
   * node->count (and node->exceptional, if the entry in @slot is
   * exceptional) once per cleared slot.  @slot itself is left alone.
   * Without multiorder support this is a no-op.
   */
  static inline void delete_sibling_entries(struct radix_tree_node *node,
  						void **slot)
  {
  #ifdef CONFIG_RADIX_TREE_MULTIORDER
  	bool exceptional = radix_tree_exceptional_entry(*slot);
  	void *sibling = node_to_entry(slot);
  	unsigned pos = get_slot_offset(node, slot) + 1;
  
  	for (; pos < RADIX_TREE_MAP_SIZE; pos++) {
  		if (node->slots[pos] != sibling)
  			break;
  
  		node->slots[pos] = NULL;
  		node->count--;
  		if (exceptional)
  			node->exceptional--;
  	}
  #endif
  }
f7942430e   Johannes Weiner   lib: radix-tree: ...
1010
  /**
   * __radix_tree_replace		- replace item in a slot
   * @root:		radix tree root
   * @node:		pointer to tree node
   * @slot:		pointer to slot in @node
   * @item:		new item to store in the slot.
   * @update_node:	callback for changing leaf nodes
   * @private:		private data to pass to @update_node
   *
   * For use with __radix_tree_lookup().  Caller must hold tree write locked
   * across slot lookup and replacement.
   *
   * Storing a NULL @item deletes the entry: its sibling slots are cleared
   * first, and after the replacement delete_node() is run on @node.  When
   * @node is non-NULL, @update_node (if provided) is called on it before
   * that.
   */
  void __radix_tree_replace(struct radix_tree_root *root,
  			  struct radix_tree_node *node,
  			  void **slot, void *item,
  			  radix_tree_update_node_t update_node, void *private)
  {
  	bool warn_typeswitch;
  
  	if (!item)
  		delete_sibling_entries(node, slot);
  
  	/*
  	 * This function supports replacing exceptional entries and
  	 * deleting entries, but that needs accounting against the
  	 * node unless the slot is root->rnode.
  	 */
  	warn_typeswitch = !node && slot != (void **)&root->rnode;
  	replace_slot(root, node, slot, item, warn_typeswitch);
  
  	if (node) {
  		if (update_node)
  			update_node(node, private);
  
  		delete_node(root, node, update_node, private);
  	}
  }
  
  /**
   * radix_tree_replace_slot	- replace item in a slot
   * @root:	radix tree root
   * @slot:	pointer to slot
   * @item:	new item to store in the slot.
   *
   * For use with radix_tree_lookup_slot(), radix_tree_gang_lookup_slot(),
   * radix_tree_gang_lookup_tag_slot().  Caller must hold tree write locked
   * across slot lookup and replacement.
   *
   * NOTE: This cannot be used to switch between non-entries (empty slots),
   * regular entries, and exceptional entries, as that requires accounting
   * inside the radix tree node, and no node is passed along here; such a
   * switch triggers a one-time warning.  When switching from one type of
   * entry to another, or deleting, use __radix_tree_lookup() and
   * __radix_tree_replace() or radix_tree_iter_replace().
   */
  void radix_tree_replace_slot(struct radix_tree_root *root,
  			     void **slot, void *item)
  {
  	/* No node is known here, so always warn on a type switch. */
  	replace_slot(root, NULL, slot, item, true);
  }
e157b5559   Matthew Wilcox   radix-tree: add r...
1067
1068
1069
1070
1071
1072
1073
1074
1075
1076
1077
1078
1079
1080
  /**
   * radix_tree_iter_replace - replace item in a slot
   * @root:	radix tree root
   * @iter:	iterator state; its node is the one holding @slot
   * @slot:	pointer to slot
   * @item:	new item to store in the slot.
   *
   * For use with radix_tree_split() and radix_tree_for_each_slot().
   * Caller must hold tree write locked across split and replacement.
   */
  void radix_tree_iter_replace(struct radix_tree_root *root,
  		const struct radix_tree_iter *iter, void **slot, void *item)
  {
  	struct radix_tree_node *node = iter->node;
  
  	/* No update_node callback is used on this path. */
  	__radix_tree_replace(root, node, slot, item, NULL, NULL);
  }
175542f57   Matthew Wilcox   radix-tree: add r...
1081
1082
1083
1084
1085
1086
1087
1088
1089
1090
1091
1092
1093
1094
1095
1096
1097
1098
1099
1100
1101
1102
1103
1104
1105
1106
1107
1108
1109
1110
1111
1112
  #ifdef CONFIG_RADIX_TREE_MULTIORDER
  /**
   * radix_tree_join - replace multiple entries with one multiorder entry
   * @root: radix tree root
   * @index: an index inside the new entry
   * @order: order of the new entry
   * @item: new entry
   *
   * Call this function to replace several entries with one larger entry.
   * The existing entries are presumed to not need freeing as a result of
   * this call.
   *
   * The replacement entry will have all the tags set on it that were set
   * on any of the entries it is replacing.
   *
   * Returns 0 on success or a negative error code if the slot could not
   * be created or the entries could not be inserted.
   */
  int radix_tree_join(struct radix_tree_root *root, unsigned long index,
  			unsigned order, void *item)
  {
  	struct radix_tree_node *node;
  	void **slot;
  	int ret;
  
  	BUG_ON(radix_tree_is_internal_node(item));
  
  	ret = __radix_tree_create(root, index, order, &node, &slot);
  	if (ret)
  		return ret;
  
  	/* A positive result is a slot count, which callers see as 0. */
  	ret = insert_entries(node, slot, item, order, true);
  	return ret < 0 ? ret : 0;
  }
e157b5559   Matthew Wilcox   radix-tree: add r...
1113
1114
1115
1116
1117
1118
1119
1120
1121
1122
1123
1124
1125
1126
1127
1128
1129
1130
1131
1132
1133
1134
1135
1136
1137
1138
1139
1140
1141
1142
1143
1144
1145
1146
1147
1148
1149
1150
1151
1152
1153
1154
1155
1156
1157
1158
1159
1160
1161
1162
1163
1164
1165
1166
1167
1168
1169
1170
1171
1172
1173
1174
  
  /**
   * radix_tree_split - Split an entry into smaller entries
   * @root: radix tree root
   * @index: An index within the large entry
   * @order: Order of new entries
   *
   * Call this function as the first step in replacing a multiorder entry
   * with several entries of lower order.  After this function returns,
   * loop over the relevant portion of the tree using radix_tree_for_each_slot()
   * and call radix_tree_iter_replace() to set up each new entry.
   *
   * The tags from this entry are replicated to all the new entries.
   *
   * The radix tree should be locked against modification during the entire
   * replacement operation.  Lock-free lookups will see RADIX_TREE_RETRY which
   * should prompt RCU walkers to restart the lookup from the root.
   */
  int radix_tree_split(struct radix_tree_root *root, unsigned long index,
  				unsigned order)
  {
  	struct radix_tree_node *parent, *node, *child;
  	void **slot;
  	unsigned int offset, end;
  	unsigned n, tag, tags = 0;
  
  	if (!__radix_tree_lookup(root, index, &parent, &slot))
  		return -ENOENT;
  	if (!parent)
  		return -ENOENT;
  
  	offset = get_slot_offset(parent, slot);
  
  	for (tag = 0; tag < RADIX_TREE_MAX_TAGS; tag++)
  		if (tag_get(parent, tag, offset))
  			tags |= 1 << tag;
  
  	for (end = offset + 1; end < RADIX_TREE_MAP_SIZE; end++) {
  		if (!is_sibling_entry(parent, parent->slots[end]))
  			break;
  		for (tag = 0; tag < RADIX_TREE_MAX_TAGS; tag++)
  			if (tags & (1 << tag))
  				tag_set(parent, tag, end);
  		/* rcu_assign_pointer ensures tags are set before RETRY */
  		rcu_assign_pointer(parent->slots[end], RADIX_TREE_RETRY);
  	}
  	rcu_assign_pointer(parent->slots[offset], RADIX_TREE_RETRY);
  	parent->exceptional -= (end - offset);
  
  	if (order == parent->shift)
  		return 0;
  	if (order > parent->shift) {
  		while (offset < end)
  			offset += insert_entries(parent, &parent->slots[offset],
  					RADIX_TREE_RETRY, order, true);
  		return 0;
  	}
  
  	node = parent;
  
  	for (;;) {
  		if (node->shift > order) {
e8de43407   Matthew Wilcox   radix-tree: ensur...
1175
1176
1177
  			child = radix_tree_node_alloc(root, node,
  					node->shift - RADIX_TREE_MAP_SHIFT,
  					offset, 0, 0);
e157b5559   Matthew Wilcox   radix-tree: add r...
1178
1179
  			if (!child)
  				goto nomem;
e157b5559   Matthew Wilcox   radix-tree: add r...
1180
1181
1182
1183
1184
1185
1186
1187
1188
1189
1190
1191
1192
1193
1194
1195
1196
1197
1198
1199
1200
1201
1202
1203
1204
1205
1206
1207
1208
1209
1210
1211
1212
1213
1214
1215
1216
1217
1218
1219
1220
1221
  			if (node != parent) {
  				node->count++;
  				node->slots[offset] = node_to_entry(child);
  				for (tag = 0; tag < RADIX_TREE_MAX_TAGS; tag++)
  					if (tags & (1 << tag))
  						tag_set(node, tag, offset);
  			}
  
  			node = child;
  			offset = 0;
  			continue;
  		}
  
  		n = insert_entries(node, &node->slots[offset],
  					RADIX_TREE_RETRY, order, false);
  		BUG_ON(n > RADIX_TREE_MAP_SIZE);
  
  		for (tag = 0; tag < RADIX_TREE_MAX_TAGS; tag++)
  			if (tags & (1 << tag))
  				tag_set(node, tag, offset);
  		offset += n;
  
  		while (offset == RADIX_TREE_MAP_SIZE) {
  			if (node == parent)
  				break;
  			offset = node->offset;
  			child = node;
  			node = node->parent;
  			rcu_assign_pointer(node->slots[offset],
  						node_to_entry(child));
  			offset++;
  		}
  		if ((node == parent) && (offset == end))
  			return 0;
  	}
  
   nomem:
  	/* Shouldn't happen; did user forget to preload? */
  	/* TODO: free all the allocated nodes */
  	WARN_ON(1);
  	return -ENOMEM;
  }
175542f57   Matthew Wilcox   radix-tree: add r...
1222
  #endif
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1223
1224
1225
1226
  /**
   *	radix_tree_tag_set - set a tag on a radix tree node
   *	@root:		radix tree root
   *	@index:		index key
   *	@tag:		tag index
   *
   *	Set the search tag (which must be < RADIX_TREE_MAX_TAGS)
   *	corresponding to @index in the radix tree, on every node from
   *	the root all the way down to the leaf node, and on the root
   *	itself.
   *
   *	Returns the address of the tagged item.  Setting a tag on a not-present
   *	item is a bug.
   */
  void *radix_tree_tag_set(struct radix_tree_root *root,
  			unsigned long index, unsigned int tag)
  {
  	struct radix_tree_node *entry;
  	unsigned long maxindex;
  
  	radix_tree_load_root(root, &entry, &maxindex);
  	BUG_ON(index > maxindex);
  
  	while (radix_tree_is_internal_node(entry)) {
  		struct radix_tree_node *parent = entry_to_node(entry);
  		unsigned offset = radix_tree_descend(parent, &entry, index);
  
  		BUG_ON(!entry);
  
  		/* Only write the bit when it is not set already. */
  		if (tag_get(parent, tag, offset))
  			continue;
  		tag_set(parent, tag, offset);
  	}
  
  	/* set the root's tag bit */
  	if (!root_tag_get(root, tag))
  		root_tag_set(root, tag);
  
  	return entry;
  }
  EXPORT_SYMBOL(radix_tree_tag_set);
d604c3245   Matthew Wilcox   radix-tree: intro...
1261
1262
1263
1264
1265
1266
1267
1268
1269
1270
1271
1272
1273
1274
1275
1276
1277
1278
1279
  /*
   * Clear @tag for slot @offset of @node and propagate the change towards
   * the root: for as long as clearing the bit leaves a node without any
   * slot carrying @tag, the bit for that node is cleared in its parent as
   * well.  The walk stops early at a slot whose bit is already clear or
   * at a node that still has @tag set on some slot.  When it runs past
   * the topmost node (or @node is NULL), the root's tag bit is cleared.
   */
  static void node_tag_clear(struct radix_tree_root *root,
  				struct radix_tree_node *node,
  				unsigned int tag, unsigned int offset)
  {
  	for (; node; offset = node->offset, node = node->parent) {
  		if (!tag_get(node, tag, offset))
  			return;
  		tag_clear(node, tag, offset);
  		if (any_tag_set(node, tag))
  			return;
  	}
  
  	/* clear the root's tag bit */
  	if (root_tag_get(root, tag))
  		root_tag_clear(root, tag);
  }
9498d2bb3   Matthew Wilcox   radix-tree: creat...
1280
1281
1282
1283
1284
1285
1286
1287
1288
1289
1290
1291
1292
1293
1294
  /*
   * Set @tag on slot @offset of @node and on the matching slot of every
   * ancestor.
   *
   * The walk stops as soon as a level is found where the bit is already set.
   * If it runs past the topmost node (or @node was NULL to begin with) the
   * root's tag bit is set as well.
   */
  static void node_tag_set(struct radix_tree_root *root,
  				struct radix_tree_node *node,
  				unsigned int tag, unsigned int offset)
  {
  	for (; node; offset = node->offset, node = node->parent) {
  		/* Already tagged at this level: stop walking up. */
  		if (tag_get(node, tag, offset))
  			return;
  
  		tag_set(node, tag, offset);
  	}
  
  	/* Walked past the top of the tree: tag the root too. */
  	if (!root_tag_get(root, tag))
  		root_tag_set(root, tag);
  }
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1295
  /**
268f42de7   Matthew Wilcox   radix-tree: delet...
1296
1297
1298
1299
1300
1301
1302
1303
1304
1305
1306
1307
   * radix_tree_iter_tag_set - set a tag on the current iterator entry
   * @root:	radix tree root
   * @iter:	iterator state
   * @tag:	tag to set
   */
  void radix_tree_iter_tag_set(struct radix_tree_root *root,
  			const struct radix_tree_iter *iter, unsigned int tag)
  {
  	/* The iterator already knows which node and slot it is parked on. */
  	struct radix_tree_node *node = iter->node;
  	unsigned int offset = iter_offset(iter);
  
  	node_tag_set(root, node, tag, offset);
  }
  
  /**
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1308
1309
1310
   *	radix_tree_tag_clear - clear a tag on a radix tree node
   *	@root:		radix tree root
   *	@index:		index key
2fcd9005c   Matthew Wilcox   radix-tree: misce...
1311
   *	@tag:		tag index
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1312
   *
daff89f32   Jonathan Corbet   [PATCH] radix-tre...
1313
   *	Clear the search tag (which must be < RADIX_TREE_MAX_TAGS)
2fcd9005c   Matthew Wilcox   radix-tree: misce...
1314
1315
   *	corresponding to @index in the radix tree.  If this causes
   *	the leaf node to have no tags set then clear the tag in the
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1316
1317
1318
1319
1320
1321
   *	next-to-leaf node, etc.
   *
   *	Returns the address of the tagged item on success, else NULL.  ie:
   *	has the same return value and semantics as radix_tree_lookup().
   */
  void *radix_tree_tag_clear(struct radix_tree_root *root,
daff89f32   Jonathan Corbet   [PATCH] radix-tre...
1322
  			unsigned long index, unsigned int tag)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1323
  {
00f47b581   Ross Zwisler   radix-tree: rewri...
1324
1325
  	struct radix_tree_node *node, *parent;
  	unsigned long maxindex;
e2bdb933a   Hugh Dickins   radix_tree: take ...
1326
  	int uninitialized_var(offset);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1327

9e85d8111   Matthew Wilcox   radix-tree: make ...
1328
  	radix_tree_load_root(root, &node, &maxindex);
00f47b581   Ross Zwisler   radix-tree: rewri...
1329
1330
  	if (index > maxindex)
  		return NULL;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1331

00f47b581   Ross Zwisler   radix-tree: rewri...
1332
  	parent = NULL;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1333

b194d16c2   Matthew Wilcox   radix-tree: renam...
1334
  	while (radix_tree_is_internal_node(node)) {
4dd6c0987   Matthew Wilcox   radix-tree: renam...
1335
  		parent = entry_to_node(node);
9e85d8111   Matthew Wilcox   radix-tree: make ...
1336
  		offset = radix_tree_descend(parent, &node, index);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1337
  	}
d604c3245   Matthew Wilcox   radix-tree: intro...
1338
1339
  	if (node)
  		node_tag_clear(root, parent, tag, offset);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1340

00f47b581   Ross Zwisler   radix-tree: rewri...
1341
  	return node;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1342
1343
  }
  EXPORT_SYMBOL(radix_tree_tag_clear);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1344
  /**
32605a181   Marcelo Tosatti   [PATCH] radix_tag...
1345
1346
1347
   * radix_tree_tag_get - get a tag on a radix tree node
   * @root:		radix tree root
   * @index:		index key
2fcd9005c   Matthew Wilcox   radix-tree: misce...
1348
   * @tag:		tag index (< RADIX_TREE_MAX_TAGS)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1349
   *
32605a181   Marcelo Tosatti   [PATCH] radix_tag...
1350
   * Return values:
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1351
   *
612d6c19d   Nick Piggin   [PATCH] radix-tre...
1352
1353
   *  0: tag not present or not set
   *  1: tag set
ce82653d6   David Howells   radix_tree_tag_ge...
1354
1355
1356
1357
   *
   * Note that the return value of this function may not be relied on, even if
   * the RCU lock is held, unless tag modification and node deletion are excluded
   * from concurrency.
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1358
1359
   */
  int radix_tree_tag_get(struct radix_tree_root *root,
daff89f32   Jonathan Corbet   [PATCH] radix-tre...
1360
  			unsigned long index, unsigned int tag)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1361
  {
4589ba6d0   Ross Zwisler   radix-tree: rewri...
1362
1363
  	struct radix_tree_node *node, *parent;
  	unsigned long maxindex;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1364

612d6c19d   Nick Piggin   [PATCH] radix-tre...
1365
1366
  	if (!root_tag_get(root, tag))
  		return 0;
9e85d8111   Matthew Wilcox   radix-tree: make ...
1367
  	radix_tree_load_root(root, &node, &maxindex);
4589ba6d0   Ross Zwisler   radix-tree: rewri...
1368
1369
  	if (index > maxindex)
  		return 0;
7cf9c2c76   Nick Piggin   [PATCH] radix-tre...
1370
1371
  	if (node == NULL)
  		return 0;
b194d16c2   Matthew Wilcox   radix-tree: renam...
1372
  	while (radix_tree_is_internal_node(node)) {
9e85d8111   Matthew Wilcox   radix-tree: make ...
1373
  		unsigned offset;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1374

4dd6c0987   Matthew Wilcox   radix-tree: renam...
1375
  		parent = entry_to_node(node);
9e85d8111   Matthew Wilcox   radix-tree: make ...
1376
  		offset = radix_tree_descend(parent, &node, index);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1377

4589ba6d0   Ross Zwisler   radix-tree: rewri...
1378
  		if (!node)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1379
  			return 0;
4589ba6d0   Ross Zwisler   radix-tree: rewri...
1380
  		if (!tag_get(parent, tag, offset))
3fa36acbc   Hugh Dickins   radix_tree: clean...
1381
  			return 0;
4589ba6d0   Ross Zwisler   radix-tree: rewri...
1382
1383
  		if (node == RADIX_TREE_RETRY)
  			break;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1384
  	}
4589ba6d0   Ross Zwisler   radix-tree: rewri...
1385
1386
  
  	return 1;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1387
1388
  }
  EXPORT_SYMBOL(radix_tree_tag_get);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1389

21ef53393   Ross Zwisler   radix-tree: add s...
1390
1391
1392
1393
1394
1395
1396
  /*
   * Record @shift in the iterator.  The store is only compiled in when
   * CONFIG_RADIX_TREE_MULTIORDER is set (presumably because iter->shift only
   * exists in that configuration); otherwise this is a no-op.
   */
  #ifdef CONFIG_RADIX_TREE_MULTIORDER
  static inline void __set_iter_shift(struct radix_tree_iter *iter,
  					unsigned int shift)
  {
  	iter->shift = shift;
  }
  #else
  static inline void __set_iter_shift(struct radix_tree_iter *iter,
  					unsigned int shift)
  {
  }
  #endif
148deab22   Matthew Wilcox   radix-tree: impro...
1397
1398
1399
1400
1401
1402
1403
1404
1405
1406
1407
1408
1409
1410
1411
1412
1413
1414
1415
1416
1417
1418
1419
1420
1421
1422
1423
1424
1425
1426
1427
1428
1429
1430
1431
1432
1433
1434
1435
1436
1437
1438
1439
1440
1441
1442
1443
1444
1445
1446
1447
1448
1449
1450
1451
  /*
   * Build the iter->tags bit-mask from the node->tags[tag] array so that
   * bit 0 of iter->tags corresponds to slot @offset of @node.
   */
  static void set_iter_tags(struct radix_tree_iter *iter,
  				struct radix_tree_node *node, unsigned offset,
  				unsigned tag)
  {
  	unsigned word = offset / BITS_PER_LONG;
  	unsigned bit = offset % BITS_PER_LONG;
  
  	iter->tags = node->tags[tag][word] >> bit;
  
  	/*
  	 * @offset lies in the last word of the bitmap: nothing to merge in and
  	 * nothing to clip.  This is always the case if RADIX_TREE_TAG_LONGS == 1.
  	 */
  	if (word >= RADIX_TREE_TAG_LONGS - 1)
  		return;
  
  	/* Fill the vacated high bits from the following word. */
  	if (bit)
  		iter->tags |= node->tags[tag][word + 1] <<
  					(BITS_PER_LONG - bit);
  
  	/* iter->tags holds only BITS_PER_LONG tags, so end the chunk there. */
  	iter->next_index = __radix_tree_iter_add(iter, BITS_PER_LONG);
  }
  
  #ifdef CONFIG_RADIX_TREE_MULTIORDER
  /*
   * Advance @slot (and the iterator's index and tag mask along with it) until
   * it holds an entry that is neither NULL nor equal to the entry form of the
   * slot preceding the starting position (presumably a sibling entry pointing
   * back at that slot).
   *
   * On success the entry is stored in *@nodep and its slot is returned.  If
   * iter->index reaches iter->next_index first, *@nodep is set to NULL and
   * NULL is returned.
   */
  static void **skip_siblings(struct radix_tree_node **nodep,
  			void **slot, struct radix_tree_iter *iter)
  {
  	void *sibling = node_to_entry(slot - 1);
  
  	while (iter->index < iter->next_index) {
  		struct radix_tree_node *entry = rcu_dereference_raw(*slot);
  
  		*nodep = entry;
  		if (entry != NULL && entry != sibling)
  			return slot;
  
  		/* Step to the next slot, keeping index and tags in sync. */
  		slot++;
  		iter->index = __radix_tree_iter_add(iter, 1);
  		iter->tags >>= 1;
  	}
  
  	*nodep = NULL;
  	return NULL;
  }
  
  /*
   * Resolve @slot to the next slot the iteration should visit.
   *
   * Sibling entries at @slot are skipped first.  Then, for as long as the
   * entry found is an internal node, the walk descends into it: for tagged
   * iteration to the first slot with the tag set, otherwise to the first
   * non-NULL slot.  iter->node, iter->shift, iter->index (and iter->tags for
   * tagged iteration) are updated on the way, and iter->next_index is clipped
   * to the end of the range covered by the slot descended into.
   *
   * Returns the resulting slot, or NULL when nothing suitable was found.  For
   * RADIX_TREE_ITER_CONTIG, having to skip ahead inside a child node also
   * zeroes iter->next_index before returning NULL.
   */
  void ** __radix_tree_next_slot(void **slot, struct radix_tree_iter *iter,
  					unsigned flags)
  {
  	const unsigned tag = flags & RADIX_TREE_ITER_TAG_MASK;
  	struct radix_tree_node *node = rcu_dereference_raw(*slot);
  
  	slot = skip_siblings(&node, slot, iter);
  
  	for (;;) {
  		unsigned long chunk_end;
  		unsigned offset;
  
  		/* Anything but a real internal node ends the descent. */
  		if (!radix_tree_is_internal_node(node) ||
  		    node == RADIX_TREE_RETRY)
  			return slot;
  
  		node = entry_to_node(node);
  		iter->node = node;
  		iter->shift = node->shift;
  
  		if (flags & RADIX_TREE_ITER_TAGGED) {
  			/* First tagged slot of the child node. */
  			offset = radix_tree_find_next_bit(node, tag, 0);
  			if (offset == RADIX_TREE_MAP_SIZE)
  				return NULL;
  			slot = &node->slots[offset];
  			iter->index = __radix_tree_iter_add(iter, offset);
  			set_iter_tags(iter, node, offset, tag);
  			node = rcu_dereference_raw(*slot);
  		} else {
  			/* First non-NULL slot of the child node. */
  			slot = &node->slots[0];
  			for (offset = 0; offset < RADIX_TREE_MAP_SIZE; offset++) {
  				node = rcu_dereference_raw(*slot);
  				if (node)
  					break;
  				slot++;
  			}
  			if (offset == RADIX_TREE_MAP_SIZE)
  				return NULL;
  			iter->index = __radix_tree_iter_add(iter, offset);
  		}
  
  		/* A contiguous walk must not skip over any slot. */
  		if ((flags & RADIX_TREE_ITER_CONTIG) && offset != 0) {
  			iter->next_index = 0;
  			return NULL;
  		}
  
  		/* Do not let the chunk extend past the slot descended into. */
  		chunk_end = (iter->index | shift_maxindex(iter->shift)) + 1;
  		if (chunk_end < iter->next_index)
  			iter->next_index = chunk_end;
  	}
  }
  EXPORT_SYMBOL(__radix_tree_next_slot);
  #else
  /*
   * Variant used when CONFIG_RADIX_TREE_MULTIORDER is not set: @slot is
   * returned unchanged and neither *@nodep nor @iter is touched.
   */
  static void **skip_siblings(struct radix_tree_node **nodep,
  			void **slot, struct radix_tree_iter *iter)
  {
  	return slot;
  }
  #endif
  
  /*
   * Prepare @iter so that the iteration can be restarted after the current
   * entry.
   *
   * The position is moved one slot forward (skipping sibling entries where
   * they exist) and the current chunk is invalidated by setting
   * iter->next_index to iter->index and clearing iter->tags, so the next
   * radix_tree_next_chunk() call starts again from iter->index.
   *
   * Always returns NULL; the advanced slot is deliberately not handed back.
   */
  void **radix_tree_iter_resume(void **slot, struct radix_tree_iter *iter)
  {
  	/* Only a sink for skip_siblings(); its value is never used here. */
  	struct radix_tree_node *node;
  
  	slot++;
  	iter->index = __radix_tree_iter_add(iter, 1);
  	/*
  	 * *slot is not loaded here: the incremented pointer may lie one past
  	 * the slot the caller owned, and skip_siblings() only dereferences it
  	 * while the index is still inside the current chunk.
  	 */
  	skip_siblings(&node, slot, iter);
  	iter->next_index = iter->index;
  	iter->tags = 0;
  	return NULL;
  }
  EXPORT_SYMBOL(radix_tree_iter_resume);
6df8ba4f8   Fengguang Wu   radixtree: introd...
1511
  /**
78c1d7848   Konstantin Khlebnikov   radix-tree: intro...
1512
1513
1514
1515
1516
1517
1518
1519
1520
1521
   * radix_tree_next_chunk - find next chunk of slots for iteration
   *
   * @root:	radix tree root
   * @iter:	iterator state
   * @flags:	RADIX_TREE_ITER_* flags and tag index
   * Returns:	pointer to chunk first slot, or NULL if iteration is over
   */
  void **radix_tree_next_chunk(struct radix_tree_root *root,
  			     struct radix_tree_iter *iter, unsigned flags)
  {
9e85d8111   Matthew Wilcox   radix-tree: make ...
1522
  	unsigned tag = flags & RADIX_TREE_ITER_TAG_MASK;
8c1244de0   Matthew Wilcox   radix-tree: tidy ...
1523
  	struct radix_tree_node *node, *child;
21ef53393   Ross Zwisler   radix-tree: add s...
1524
  	unsigned long index, offset, maxindex;
78c1d7848   Konstantin Khlebnikov   radix-tree: intro...
1525
1526
1527
1528
1529
1530
1531
1532
1533
  
  	if ((flags & RADIX_TREE_ITER_TAGGED) && !root_tag_get(root, tag))
  		return NULL;
  
  	/*
  	 * Catch next_index overflow after ~0UL. iter->index never overflows
  	 * during iterating; it can be zero only at the beginning.
  	 * And we cannot overflow iter->next_index in a single step,
  	 * because RADIX_TREE_MAP_SHIFT < BITS_PER_LONG.
fffaee365   Konstantin Khlebnikov   radix-tree: fix c...
1534
1535
  	 *
  	 * This condition also used by radix_tree_next_slot() to stop
91b9677c4   Matthew Wilcox   radix-tree: fix typo
1536
  	 * contiguous iterating, and forbid switching to the next chunk.
78c1d7848   Konstantin Khlebnikov   radix-tree: intro...
1537
1538
1539
1540
  	 */
  	index = iter->next_index;
  	if (!index && iter->index)
  		return NULL;
21ef53393   Ross Zwisler   radix-tree: add s...
1541
   restart:
9e85d8111   Matthew Wilcox   radix-tree: make ...
1542
  	radix_tree_load_root(root, &child, &maxindex);
21ef53393   Ross Zwisler   radix-tree: add s...
1543
1544
  	if (index > maxindex)
  		return NULL;
8c1244de0   Matthew Wilcox   radix-tree: tidy ...
1545
1546
  	if (!child)
  		return NULL;
21ef53393   Ross Zwisler   radix-tree: add s...
1547

8c1244de0   Matthew Wilcox   radix-tree: tidy ...
1548
  	if (!radix_tree_is_internal_node(child)) {
78c1d7848   Konstantin Khlebnikov   radix-tree: intro...
1549
  		/* Single-slot tree */
21ef53393   Ross Zwisler   radix-tree: add s...
1550
1551
  		iter->index = index;
  		iter->next_index = maxindex + 1;
78c1d7848   Konstantin Khlebnikov   radix-tree: intro...
1552
  		iter->tags = 1;
268f42de7   Matthew Wilcox   radix-tree: delet...
1553
  		iter->node = NULL;
8c1244de0   Matthew Wilcox   radix-tree: tidy ...
1554
  		__set_iter_shift(iter, 0);
78c1d7848   Konstantin Khlebnikov   radix-tree: intro...
1555
  		return (void **)&root->rnode;
8c1244de0   Matthew Wilcox   radix-tree: tidy ...
1556
  	}
21ef53393   Ross Zwisler   radix-tree: add s...
1557

8c1244de0   Matthew Wilcox   radix-tree: tidy ...
1558
1559
  	do {
  		node = entry_to_node(child);
9e85d8111   Matthew Wilcox   radix-tree: make ...
1560
  		offset = radix_tree_descend(node, &child, index);
21ef53393   Ross Zwisler   radix-tree: add s...
1561

78c1d7848   Konstantin Khlebnikov   radix-tree: intro...
1562
  		if ((flags & RADIX_TREE_ITER_TAGGED) ?
8c1244de0   Matthew Wilcox   radix-tree: tidy ...
1563
  				!tag_get(node, tag, offset) : !child) {
78c1d7848   Konstantin Khlebnikov   radix-tree: intro...
1564
1565
1566
1567
1568
  			/* Hole detected */
  			if (flags & RADIX_TREE_ITER_CONTIG)
  				return NULL;
  
  			if (flags & RADIX_TREE_ITER_TAGGED)
bc412fca6   Matthew Wilcox   radix-tree: make ...
1569
  				offset = radix_tree_find_next_bit(node, tag,
78c1d7848   Konstantin Khlebnikov   radix-tree: intro...
1570
1571
1572
  						offset + 1);
  			else
  				while (++offset	< RADIX_TREE_MAP_SIZE) {
21ef53393   Ross Zwisler   radix-tree: add s...
1573
1574
1575
1576
  					void *slot = node->slots[offset];
  					if (is_sibling_entry(node, slot))
  						continue;
  					if (slot)
78c1d7848   Konstantin Khlebnikov   radix-tree: intro...
1577
1578
  						break;
  				}
8c1244de0   Matthew Wilcox   radix-tree: tidy ...
1579
  			index &= ~node_maxindex(node);
9e85d8111   Matthew Wilcox   radix-tree: make ...
1580
  			index += offset << node->shift;
78c1d7848   Konstantin Khlebnikov   radix-tree: intro...
1581
1582
1583
1584
1585
  			/* Overflow after ~0UL */
  			if (!index)
  				return NULL;
  			if (offset == RADIX_TREE_MAP_SIZE)
  				goto restart;
8c1244de0   Matthew Wilcox   radix-tree: tidy ...
1586
  			child = rcu_dereference_raw(node->slots[offset]);
78c1d7848   Konstantin Khlebnikov   radix-tree: intro...
1587
  		}
e157b5559   Matthew Wilcox   radix-tree: add r...
1588
  		if (!child)
78c1d7848   Konstantin Khlebnikov   radix-tree: intro...
1589
  			goto restart;
e157b5559   Matthew Wilcox   radix-tree: add r...
1590
1591
  		if (child == RADIX_TREE_RETRY)
  			break;
8c1244de0   Matthew Wilcox   radix-tree: tidy ...
1592
  	} while (radix_tree_is_internal_node(child));
78c1d7848   Konstantin Khlebnikov   radix-tree: intro...
1593
1594
  
  	/* Update the iterator state */
8c1244de0   Matthew Wilcox   radix-tree: tidy ...
1595
1596
  	iter->index = (index &~ node_maxindex(node)) | (offset << node->shift);
  	iter->next_index = (index | node_maxindex(node)) + 1;
268f42de7   Matthew Wilcox   radix-tree: delet...
1597
  	iter->node = node;
9e85d8111   Matthew Wilcox   radix-tree: make ...
1598
  	__set_iter_shift(iter, node->shift);
78c1d7848   Konstantin Khlebnikov   radix-tree: intro...
1599

148deab22   Matthew Wilcox   radix-tree: impro...
1600
1601
  	if (flags & RADIX_TREE_ITER_TAGGED)
  		set_iter_tags(iter, node, offset, tag);
78c1d7848   Konstantin Khlebnikov   radix-tree: intro...
1602
1603
1604
1605
1606
1607
  
  	return node->slots + offset;
  }
  EXPORT_SYMBOL(radix_tree_next_chunk);
  
  /**
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1608
1609
1610
1611
1612
1613
1614
1615
1616
1617
1618
   *	radix_tree_gang_lookup - perform multiple lookup on a radix tree
   *	@root:		radix tree root
   *	@results:	where the results of the lookup are placed
   *	@first_index:	start the lookup from this key
   *	@max_items:	place up to this many items at *results
   *
   *	Performs an index-ascending scan of the tree for present items.  Places
   *	them at *@results and returns the number of items which were placed at
   *	*@results.
   *
   *	The implementation is naive.
7cf9c2c76   Nick Piggin   [PATCH] radix-tre...
1619
1620
1621
   *
   *	Like radix_tree_lookup, radix_tree_gang_lookup may be called under
   *	rcu_read_lock. In this case, rather than the returned results being
2fcd9005c   Matthew Wilcox   radix-tree: misce...
1622
1623
1624
1625
   *	an atomic snapshot of the tree at a single point in time, the
   *	semantics of an RCU protected gang lookup are as though multiple
   *	radix_tree_lookups have been issued in individual locks, and results
   *	stored in 'results'.
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1626
1627
1628
1629
1630
   */
  unsigned int
  radix_tree_gang_lookup(struct radix_tree_root *root, void **results,
  			unsigned long first_index, unsigned int max_items)
  {
cebbd29e1   Konstantin Khlebnikov   radix-tree: rewri...
1631
1632
1633
  	struct radix_tree_iter iter;
  	void **slot;
  	unsigned int ret = 0;
7cf9c2c76   Nick Piggin   [PATCH] radix-tre...
1634

cebbd29e1   Konstantin Khlebnikov   radix-tree: rewri...
1635
  	if (unlikely(!max_items))
7cf9c2c76   Nick Piggin   [PATCH] radix-tre...
1636
  		return 0;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1637

cebbd29e1   Konstantin Khlebnikov   radix-tree: rewri...
1638
  	radix_tree_for_each_slot(slot, root, &iter, first_index) {
46437f9a5   Matthew Wilcox   radix-tree: fix r...
1639
  		results[ret] = rcu_dereference_raw(*slot);
cebbd29e1   Konstantin Khlebnikov   radix-tree: rewri...
1640
1641
  		if (!results[ret])
  			continue;
b194d16c2   Matthew Wilcox   radix-tree: renam...
1642
  		if (radix_tree_is_internal_node(results[ret])) {
46437f9a5   Matthew Wilcox   radix-tree: fix r...
1643
1644
1645
  			slot = radix_tree_iter_retry(&iter);
  			continue;
  		}
cebbd29e1   Konstantin Khlebnikov   radix-tree: rewri...
1646
  		if (++ret == max_items)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1647
  			break;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1648
  	}
7cf9c2c76   Nick Piggin   [PATCH] radix-tre...
1649

1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1650
1651
1652
  	return ret;
  }
  EXPORT_SYMBOL(radix_tree_gang_lookup);
47feff2c8   Nick Piggin   radix-tree: add g...
1653
1654
1655
1656
  /**
   *	radix_tree_gang_lookup_slot - perform multiple slot lookup on radix tree
   *	@root:		radix tree root
   *	@results:	where the results of the lookup are placed
6328650bb   Hugh Dickins   radix_tree: excep...
1657
   *	@indices:	where their indices should be placed (but usually NULL)
47feff2c8   Nick Piggin   radix-tree: add g...
1658
1659
1660
1661
1662
1663
1664
1665
1666
1667
1668
1669
1670
1671
   *	@first_index:	start the lookup from this key
   *	@max_items:	place up to this many items at *results
   *
   *	Performs an index-ascending scan of the tree for present items.  Places
   *	their slots at *@results and returns the number of items which were
   *	placed at *@results.
   *
   *	The implementation is naive.
   *
   *	Like radix_tree_gang_lookup as far as RCU and locking goes. Slots must
   *	be dereferenced with radix_tree_deref_slot, and if using only RCU
   *	protection, radix_tree_deref_slot may fail requiring a retry.
   */
  unsigned int
6328650bb   Hugh Dickins   radix_tree: excep...
1672
1673
  radix_tree_gang_lookup_slot(struct radix_tree_root *root,
  			void ***results, unsigned long *indices,
47feff2c8   Nick Piggin   radix-tree: add g...
1674
1675
  			unsigned long first_index, unsigned int max_items)
  {
cebbd29e1   Konstantin Khlebnikov   radix-tree: rewri...
1676
1677
1678
  	struct radix_tree_iter iter;
  	void **slot;
  	unsigned int ret = 0;
47feff2c8   Nick Piggin   radix-tree: add g...
1679

cebbd29e1   Konstantin Khlebnikov   radix-tree: rewri...
1680
  	if (unlikely(!max_items))
47feff2c8   Nick Piggin   radix-tree: add g...
1681
  		return 0;
cebbd29e1   Konstantin Khlebnikov   radix-tree: rewri...
1682
1683
  	radix_tree_for_each_slot(slot, root, &iter, first_index) {
  		results[ret] = slot;
6328650bb   Hugh Dickins   radix_tree: excep...
1684
  		if (indices)
cebbd29e1   Konstantin Khlebnikov   radix-tree: rewri...
1685
1686
  			indices[ret] = iter.index;
  		if (++ret == max_items)
47feff2c8   Nick Piggin   radix-tree: add g...
1687
  			break;
47feff2c8   Nick Piggin   radix-tree: add g...
1688
1689
1690
1691
1692
  	}
  
  	return ret;
  }
  EXPORT_SYMBOL(radix_tree_gang_lookup_slot);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1693
1694
1695
1696
1697
1698
1699
  /**
   *	radix_tree_gang_lookup_tag - perform multiple lookup on a radix tree
   *	                             based on a tag
   *	@root:		radix tree root
   *	@results:	where the results of the lookup are placed
   *	@first_index:	start the lookup from this key
   *	@max_items:	place up to this many items at *results
daff89f32   Jonathan Corbet   [PATCH] radix-tre...
1700
   *	@tag:		the tag index (< RADIX_TREE_MAX_TAGS)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1701
1702
1703
1704
1705
1706
1707
   *
   *	Performs an index-ascending scan of the tree for present items which
   *	have the tag indexed by @tag set.  Places the items at *@results and
   *	returns the number of items which were placed at *@results.
   */
  unsigned int
  radix_tree_gang_lookup_tag(struct radix_tree_root *root, void **results,
daff89f32   Jonathan Corbet   [PATCH] radix-tre...
1708
1709
  		unsigned long first_index, unsigned int max_items,
  		unsigned int tag)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1710
  {
cebbd29e1   Konstantin Khlebnikov   radix-tree: rewri...
1711
1712
1713
  	struct radix_tree_iter iter;
  	void **slot;
  	unsigned int ret = 0;
612d6c19d   Nick Piggin   [PATCH] radix-tre...
1714

cebbd29e1   Konstantin Khlebnikov   radix-tree: rewri...
1715
  	if (unlikely(!max_items))
7cf9c2c76   Nick Piggin   [PATCH] radix-tre...
1716
  		return 0;
cebbd29e1   Konstantin Khlebnikov   radix-tree: rewri...
1717
  	radix_tree_for_each_tagged(slot, root, &iter, first_index, tag) {
46437f9a5   Matthew Wilcox   radix-tree: fix r...
1718
  		results[ret] = rcu_dereference_raw(*slot);
cebbd29e1   Konstantin Khlebnikov   radix-tree: rewri...
1719
1720
  		if (!results[ret])
  			continue;
b194d16c2   Matthew Wilcox   radix-tree: renam...
1721
  		if (radix_tree_is_internal_node(results[ret])) {
46437f9a5   Matthew Wilcox   radix-tree: fix r...
1722
1723
1724
  			slot = radix_tree_iter_retry(&iter);
  			continue;
  		}
cebbd29e1   Konstantin Khlebnikov   radix-tree: rewri...
1725
  		if (++ret == max_items)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1726
  			break;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1727
  	}
7cf9c2c76   Nick Piggin   [PATCH] radix-tre...
1728

1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1729
1730
1731
1732
1733
  	return ret;
  }
  EXPORT_SYMBOL(radix_tree_gang_lookup_tag);
  
  /**
47feff2c8   Nick Piggin   radix-tree: add g...
1734
1735
1736
1737
1738
1739
1740
1741
1742
1743
1744
1745
1746
1747
1748
1749
1750
   *	radix_tree_gang_lookup_tag_slot - perform multiple slot lookup on a
   *					  radix tree based on a tag
   *	@root:		radix tree root
   *	@results:	where the results of the lookup are placed
   *	@first_index:	start the lookup from this key
   *	@max_items:	place up to this many items at *results
   *	@tag:		the tag index (< RADIX_TREE_MAX_TAGS)
   *
   *	Performs an index-ascending scan of the tree for present items which
   *	have the tag indexed by @tag set.  Places the slots at *@results and
   *	returns the number of slots which were placed at *@results.
   */
  unsigned int
  radix_tree_gang_lookup_tag_slot(struct radix_tree_root *root, void ***results,
  		unsigned long first_index, unsigned int max_items,
  		unsigned int tag)
  {
cebbd29e1   Konstantin Khlebnikov   radix-tree: rewri...
1751
1752
1753
  	struct radix_tree_iter iter;
  	void **slot;
  	unsigned int ret = 0;
47feff2c8   Nick Piggin   radix-tree: add g...
1754

cebbd29e1   Konstantin Khlebnikov   radix-tree: rewri...
1755
  	if (unlikely(!max_items))
47feff2c8   Nick Piggin   radix-tree: add g...
1756
  		return 0;
cebbd29e1   Konstantin Khlebnikov   radix-tree: rewri...
1757
1758
1759
  	radix_tree_for_each_tagged(slot, root, &iter, first_index, tag) {
  		results[ret] = slot;
  		if (++ret == max_items)
47feff2c8   Nick Piggin   radix-tree: add g...
1760
  			break;
47feff2c8   Nick Piggin   radix-tree: add g...
1761
1762
1763
1764
1765
  	}
  
  	return ret;
  }
  EXPORT_SYMBOL(radix_tree_gang_lookup_tag_slot);
47feff2c8   Nick Piggin   radix-tree: add g...
1766
  /**
139e56166   Johannes Weiner   lib: radix_tree: ...
1767
1768
   *	__radix_tree_delete_node    -    try to free node after clearing a slot
   *	@root:		radix tree root
139e56166   Johannes Weiner   lib: radix_tree: ...
1769
1770
1771
1772
1773
   *	@node:		node whose slot has just been cleared
   *
   *	After clearing a slot in @node, which belongs to the radix tree
   *	rooted at @root, call this function to attempt freeing the
   *	node and shrinking the tree.
139e56166   Johannes Weiner   lib: radix_tree: ...
1774
   */
14b468791   Johannes Weiner   mm: workingset: m...
1775
  void __radix_tree_delete_node(struct radix_tree_root *root,
139e56166   Johannes Weiner   lib: radix_tree: ...
1776
1777
  			      struct radix_tree_node *node)
  {
14b468791   Johannes Weiner   mm: workingset: m...
1778
  	/*
  	 * Thin wrapper around delete_node().  NOTE(review): the two trailing
  	 * NULL arguments look like an optional callback and its private data;
  	 * confirm against delete_node().
  	 */
  	delete_node(root, node, NULL, NULL);
139e56166   Johannes Weiner   lib: radix_tree: ...
1779
1780
1781
  }
  
  /**
53c59f262   Johannes Weiner   lib: radix-tree: ...
1782
   *	radix_tree_delete_item    -    delete an item from a radix tree
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1783
1784
   *	@root:		radix tree root
   *	@index:		index key
53c59f262   Johannes Weiner   lib: radix-tree: ...
1785
   *	@item:		expected item
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1786
   *
53c59f262   Johannes Weiner   lib: radix-tree: ...
1787
   *	Remove @item at @index from the radix tree rooted at @root.
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1788
   *
53c59f262   Johannes Weiner   lib: radix-tree: ...
1789
1790
   *	Returns the address of the deleted item, or NULL if it was not present
   *	or the entry at the given @index was not @item.
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1791
   */
53c59f262   Johannes Weiner   lib: radix-tree: ...
1792
1793
  void *radix_tree_delete_item(struct radix_tree_root *root,
  			     unsigned long index, void *item)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1794
  {
139e56166   Johannes Weiner   lib: radix_tree: ...
1795
  	struct radix_tree_node *node;
57578c2ea   Matthew Wilcox   raxix-tree: intro...
1796
  	unsigned int offset;
139e56166   Johannes Weiner   lib: radix_tree: ...
1797
1798
  	void **slot;
  	void *entry;
d5274261e   Nick Piggin   [PATCH] radix tre...
1799
  	int tag;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1800

139e56166   Johannes Weiner   lib: radix_tree: ...
1801
1802
1803
  	entry = __radix_tree_lookup(root, index, &node, &slot);
  	if (!entry)
  		return NULL;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1804

139e56166   Johannes Weiner   lib: radix_tree: ...
1805
1806
1807
1808
  	if (item && entry != item)
  		return NULL;
  
  	if (!node) {
612d6c19d   Nick Piggin   [PATCH] radix-tre...
1809
1810
  		root_tag_clear_all(root);
  		root->rnode = NULL;
139e56166   Johannes Weiner   lib: radix_tree: ...
1811
  		return entry;
612d6c19d   Nick Piggin   [PATCH] radix-tre...
1812
  	}
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1813

29e0967c2   Matthew Wilcox   radix-tree: fix d...
1814
  	offset = get_slot_offset(node, slot);
53c59f262   Johannes Weiner   lib: radix-tree: ...
1815

d604c3245   Matthew Wilcox   radix-tree: intro...
1816
1817
1818
  	/* Clear all tags associated with the item to be deleted.  */
  	for (tag = 0; tag < RADIX_TREE_MAX_TAGS; tag++)
  		node_tag_clear(root, node, tag, offset);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1819

4d693d086   Johannes Weiner   lib: radix-tree: ...
1820
  	__radix_tree_replace(root, node, slot, NULL, NULL, NULL);
612d6c19d   Nick Piggin   [PATCH] radix-tre...
1821

139e56166   Johannes Weiner   lib: radix_tree: ...
1822
  	return entry;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1823
  }
53c59f262   Johannes Weiner   lib: radix-tree: ...
1824
1825
1826
1827
1828
1829
1830
1831
1832
1833
1834
1835
1836
1837
1838
  EXPORT_SYMBOL(radix_tree_delete_item);
  
  /**
   *	radix_tree_delete    -    delete an item from a radix tree
   *	@root:		radix tree root
   *	@index:		index key
   *
   *	Remove the item at @index from the radix tree rooted at @root.
   *	This is radix_tree_delete_item() called with a NULL expected item,
   *	so whatever entry is stored at @index is removed.
   *
   *	Returns the address of the deleted item, or NULL if it was not present.
   */
  void *radix_tree_delete(struct radix_tree_root *root, unsigned long index)
  {
  	return radix_tree_delete_item(root, index, NULL);
  }
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1839
  EXPORT_SYMBOL(radix_tree_delete);
d3798ae8c   Johannes Weiner   mm: filemap: don'...
1840
1841
1842
  void radix_tree_clear_tags(struct radix_tree_root *root,
  			   struct radix_tree_node *node,
  			   void **slot)
d604c3245   Matthew Wilcox   radix-tree: intro...
1843
  {
d604c3245   Matthew Wilcox   radix-tree: intro...
1844
1845
1846
1847
1848
1849
1850
1851
  	if (node) {
  		unsigned int tag, offset = get_slot_offset(node, slot);
  		for (tag = 0; tag < RADIX_TREE_MAX_TAGS; tag++)
  			node_tag_clear(root, node, tag, offset);
  	} else {
  		/* Clear root node tags */
  		root->gfp_mask &= __GFP_BITS_MASK;
  	}
d604c3245   Matthew Wilcox   radix-tree: intro...
1852
  }
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1853
1854
1855
1856
1857
  /**
   *	radix_tree_tagged - test whether any items in the tree are tagged
   *	@root:		radix tree root
   *	@tag:		tag to test
   *
   *	Only the root's tag bit is consulted; the tree itself is not walked.
   *	Returns the value reported by root_tag_get() for @tag (presumably
   *	non-zero when at least one item carries @tag).
   */
daff89f32   Jonathan Corbet   [PATCH] radix-tre...
1858
  int radix_tree_tagged(struct radix_tree_root *root, unsigned int tag)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1859
  {
612d6c19d   Nick Piggin   [PATCH] radix-tre...
1860
  	return root_tag_get(root, tag);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1861
1862
1863
1864
  }
  EXPORT_SYMBOL(radix_tree_tagged);
  
  static void
449dd6984   Johannes Weiner   mm: keep page cac...
1865
  radix_tree_node_ctor(void *arg)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1866
  {
449dd6984   Johannes Weiner   mm: keep page cac...
1867
1868
1869
1870
  	struct radix_tree_node *node = arg;
  
  	memset(node, 0, sizeof(*node));
  	INIT_LIST_HEAD(&node->private_list);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1871
  }
c78c66d1d   Kirill A. Shutemov   radix-tree: imple...
1872
1873
1874
1875
1876
1877
1878
1879
1880
1881
1882
1883
1884
1885
1886
1887
1888
1889
1890
1891
1892
1893
1894
1895
  /*
   * Return a mask with the low (@height * RADIX_TREE_MAP_SHIFT) bits set,
   * i.e. the largest index addressable with @height levels.  The result
   * saturates at ~0UL once that width exceeds RADIX_TREE_INDEX_BITS and is
   * 0 when the required right shift would be BITS_PER_LONG or more.
   */
  static __init unsigned long __maxindex(unsigned int height)
  {
  	unsigned int width = height * RADIX_TREE_MAP_SHIFT;
  	int shift = RADIX_TREE_INDEX_BITS - width;
  	unsigned long mask;
  
  	if (shift < 0)
  		mask = ~0UL;
  	else if (shift >= BITS_PER_LONG)
  		mask = 0UL;	/* a shift by the full word width is undefined */
  	else
  		mask = ~0UL >> shift;
  
  	return mask;
  }
  
  /*
   * Fill in height_to_maxnodes[]: entry i accumulates
   * (__maxindex(j) + 1) for every j below i.  The additions are applied on
   * top of whatever the table already holds.
   */
  static __init void radix_tree_init_maxnodes(void)
  {
  	unsigned long height_to_maxindex[RADIX_TREE_MAX_PATH + 1];
  	unsigned int height, level;
  
  	for (height = 0; height < ARRAY_SIZE(height_to_maxindex); height++)
  		height_to_maxindex[height] = __maxindex(height);
  
  	for (height = 0; height < ARRAY_SIZE(height_to_maxnodes); height++) {
  		/* Walk the levels from height - 1 down to 0. */
  		level = height;
  		while (level-- > 0)
  			height_to_maxnodes[height] +=
  					height_to_maxindex[level] + 1;
  	}
  }
d544abd5f   Sebastian Andrzej Siewior   lib/radix-tree: C...
1896
  static int radix_tree_cpu_dead(unsigned int cpu)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1897
  {
2fcd9005c   Matthew Wilcox   radix-tree: misce...
1898
1899
1900
1901
  	struct radix_tree_preload *rtp;
  	struct radix_tree_node *node;
  
  	/* Free per-cpu pool of preloaded nodes */
d544abd5f   Sebastian Andrzej Siewior   lib/radix-tree: C...
1902
1903
1904
1905
1906
1907
  	rtp = &per_cpu(radix_tree_preloads, cpu);
  	while (rtp->nr) {
  		node = rtp->nodes;
  		rtp->nodes = node->private_data;
  		kmem_cache_free(radix_tree_node_cachep, node);
  		rtp->nr--;
2fcd9005c   Matthew Wilcox   radix-tree: misce...
1908
  	}
d544abd5f   Sebastian Andrzej Siewior   lib/radix-tree: C...
1909
  	return 0;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1910
  }
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1911
1912
1913
  
  /*
   * Boot-time setup: create the slab cache for radix tree nodes, fill in the
   * height_to_maxnodes[] table and register radix_tree_cpu_dead() for the
   * CPUHP_RADIX_DEAD hotplug state.
   */
  void __init radix_tree_init(void)
  {
d544abd5f   Sebastian Andrzej Siewior   lib/radix-tree: C...
1914
  	int ret;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1915
1916
  	/*
  	 * NOTE(review): the result is not checked for NULL; SLAB_PANIC
  	 * presumably makes a failed cache creation fatal - confirm.
  	 */
  	radix_tree_node_cachep = kmem_cache_create("radix_tree_node",
  			sizeof(struct radix_tree_node), 0,
488514d17   Christoph Lameter   Remove set_migrat...
1917
1918
  			SLAB_PANIC | SLAB_RECLAIM_ACCOUNT,
  			radix_tree_node_ctor);
c78c66d1d   Kirill A. Shutemov   radix-tree: imple...
1919
  	radix_tree_init_maxnodes();
d544abd5f   Sebastian Andrzej Siewior   lib/radix-tree: C...
1920
1921
1922
  	/* Only a teardown callback is registered; the startup one is NULL. */
  	ret = cpuhp_setup_state_nocalls(CPUHP_RADIX_DEAD, "lib/radix:dead",
  					NULL, radix_tree_cpu_dead);
  	/* A registration failure is reported with a warning, nothing more. */
  	WARN_ON(ret < 0);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1923
  }