idr: fix top layer handling
[linux-2.6-block.git] / lib / idr.c
CommitLineData
1da177e4
LT
/*
 * 2002-10-18  written by Jim Houston jim.houston@ccur.com
 *	Copyright (C) 2002 by Concurrent Computer Corporation
 *	Distributed under the GNU GPL license version 2.
 *
 * Modified by George Anzinger to reuse immediately and to use
 * find bit instructions.  Also removed _irq on spinlocks.
 *
 * Modified by Nadia Derbey to make it RCU safe.
 *
 * Small id to pointer translation service.
 *
 * It uses a radix tree like structure as a sparse array indexed
 * by the id to obtain the pointer.  The bitmap makes allocating
 * a new id quick.
 *
 * You call it to allocate an id (an int) and associate with that id a
 * pointer or whatever; we treat it as a (void *).  You can pass this
 * id to a user for him to pass back at a later time.  You then pass
 * that id to this code and it returns your pointer.
 *
 * You can release ids at any time.  When all ids are released, most of
 * the memory is returned (we keep MAX_IDR_FREE) in a local pool so we
 * don't need to go to the memory "store" during an id allocate, just
 * so you don't need to be too concerned about locking and conflicts
 * with the slab allocator.
 */
28
29#ifndef TEST // to test in user space...
30#include <linux/slab.h>
31#include <linux/init.h>
8bc3bcc9 32#include <linux/export.h>
1da177e4 33#endif
5806f07c 34#include <linux/err.h>
1da177e4
LT
35#include <linux/string.h>
36#include <linux/idr.h>
88eca020 37#include <linux/spinlock.h>
d5c7409f
TH
38#include <linux/percpu.h>
39#include <linux/hardirq.h>
1da177e4 40
e18b890b 41static struct kmem_cache *idr_layer_cache;
d5c7409f
TH
42static DEFINE_PER_CPU(struct idr_layer *, idr_preload_head);
43static DEFINE_PER_CPU(int, idr_preload_cnt);
88eca020 44static DEFINE_SPINLOCK(simple_ida_lock);
1da177e4 45
326cf0f0
TH
46/* the maximum ID which can be allocated given idr->layers */
47static int idr_max(int layers)
48{
49 int bits = min_t(int, layers * IDR_BITS, MAX_IDR_SHIFT);
50
51 return (1 << bits) - 1;
52}
53
4ae53789 54static struct idr_layer *get_from_free_list(struct idr *idp)
1da177e4
LT
55{
56 struct idr_layer *p;
c259cc28 57 unsigned long flags;
1da177e4 58
c259cc28 59 spin_lock_irqsave(&idp->lock, flags);
1da177e4
LT
60 if ((p = idp->id_free)) {
61 idp->id_free = p->ary[0];
62 idp->id_free_cnt--;
63 p->ary[0] = NULL;
64 }
c259cc28 65 spin_unlock_irqrestore(&idp->lock, flags);
1da177e4
LT
66 return(p);
67}
68
d5c7409f
TH
69/**
70 * idr_layer_alloc - allocate a new idr_layer
71 * @gfp_mask: allocation mask
72 * @layer_idr: optional idr to allocate from
73 *
74 * If @layer_idr is %NULL, directly allocate one using @gfp_mask or fetch
75 * one from the per-cpu preload buffer. If @layer_idr is not %NULL, fetch
76 * an idr_layer from @idr->id_free.
77 *
78 * @layer_idr is to maintain backward compatibility with the old alloc
79 * interface - idr_pre_get() and idr_get_new*() - and will be removed
80 * together with per-pool preload buffer.
81 */
82static struct idr_layer *idr_layer_alloc(gfp_t gfp_mask, struct idr *layer_idr)
83{
84 struct idr_layer *new;
85
86 /* this is the old path, bypass to get_from_free_list() */
87 if (layer_idr)
88 return get_from_free_list(layer_idr);
89
90 /* try to allocate directly from kmem_cache */
91 new = kmem_cache_zalloc(idr_layer_cache, gfp_mask);
92 if (new)
93 return new;
94
95 /*
96 * Try to fetch one from the per-cpu preload buffer if in process
97 * context. See idr_preload() for details.
98 */
99 if (in_interrupt())
100 return NULL;
101
102 preempt_disable();
103 new = __this_cpu_read(idr_preload_head);
104 if (new) {
105 __this_cpu_write(idr_preload_head, new->ary[0]);
106 __this_cpu_dec(idr_preload_cnt);
107 new->ary[0] = NULL;
108 }
109 preempt_enable();
110 return new;
111}
112
cf481c20
ND
113static void idr_layer_rcu_free(struct rcu_head *head)
114{
115 struct idr_layer *layer;
116
117 layer = container_of(head, struct idr_layer, rcu_head);
118 kmem_cache_free(idr_layer_cache, layer);
119}
120
121static inline void free_layer(struct idr_layer *p)
122{
123 call_rcu(&p->rcu_head, idr_layer_rcu_free);
124}
125
1eec0056 126/* only called when idp->lock is held */
4ae53789 127static void __move_to_free_list(struct idr *idp, struct idr_layer *p)
1eec0056
SR
128{
129 p->ary[0] = idp->id_free;
130 idp->id_free = p;
131 idp->id_free_cnt++;
132}
133
4ae53789 134static void move_to_free_list(struct idr *idp, struct idr_layer *p)
1da177e4 135{
c259cc28
RD
136 unsigned long flags;
137
1da177e4
LT
138 /*
139 * Depends on the return element being zeroed.
140 */
c259cc28 141 spin_lock_irqsave(&idp->lock, flags);
4ae53789 142 __move_to_free_list(idp, p);
c259cc28 143 spin_unlock_irqrestore(&idp->lock, flags);
1da177e4
LT
144}
145
e33ac8bd
TH
146static void idr_mark_full(struct idr_layer **pa, int id)
147{
148 struct idr_layer *p = pa[0];
149 int l = 0;
150
151 __set_bit(id & IDR_MASK, &p->bitmap);
152 /*
153 * If this layer is full mark the bit in the layer above to
154 * show that this part of the radix tree is full. This may
155 * complete the layer above and require walking up the radix
156 * tree.
157 */
158 while (p->bitmap == IDR_FULL) {
159 if (!(p = pa[++l]))
160 break;
161 id = id >> IDR_BITS;
162 __set_bit((id & IDR_MASK), &p->bitmap);
163 }
164}
165
1da177e4 166/**
56083ab1 167 * idr_pre_get - reserve resources for idr allocation
1da177e4
LT
168 * @idp: idr handle
169 * @gfp_mask: memory allocation flags
170 *
066a9be6
NA
171 * This function should be called prior to calling the idr_get_new* functions.
172 * It preallocates enough memory to satisfy the worst possible allocation. The
173 * caller should pass in GFP_KERNEL if possible. This of course requires that
174 * no spinning locks be held.
1da177e4 175 *
56083ab1
RD
176 * If the system is REALLY out of memory this function returns %0,
177 * otherwise %1.
1da177e4 178 */
fd4f2df2 179int idr_pre_get(struct idr *idp, gfp_t gfp_mask)
1da177e4 180{
125c4c70 181 while (idp->id_free_cnt < MAX_IDR_FREE) {
1da177e4 182 struct idr_layer *new;
5b019e99 183 new = kmem_cache_zalloc(idr_layer_cache, gfp_mask);
e15ae2dd 184 if (new == NULL)
1da177e4 185 return (0);
4ae53789 186 move_to_free_list(idp, new);
1da177e4
LT
187 }
188 return 1;
189}
190EXPORT_SYMBOL(idr_pre_get);
191
12d1b439
TH
192/**
193 * sub_alloc - try to allocate an id without growing the tree depth
194 * @idp: idr handle
195 * @starting_id: id to start search at
196 * @id: pointer to the allocated handle
197 * @pa: idr_layer[MAX_IDR_LEVEL] used as backtrack buffer
d5c7409f
TH
198 * @gfp_mask: allocation mask for idr_layer_alloc()
199 * @layer_idr: optional idr passed to idr_layer_alloc()
12d1b439
TH
200 *
201 * Allocate an id in range [@starting_id, INT_MAX] from @idp without
202 * growing its depth. Returns
203 *
204 * the allocated id >= 0 if successful,
205 * -EAGAIN if the tree needs to grow for allocation to succeed,
206 * -ENOSPC if the id space is exhausted,
207 * -ENOMEM if more idr_layers need to be allocated.
208 */
d5c7409f
TH
209static int sub_alloc(struct idr *idp, int *starting_id, struct idr_layer **pa,
210 gfp_t gfp_mask, struct idr *layer_idr)
1da177e4
LT
211{
212 int n, m, sh;
213 struct idr_layer *p, *new;
7aae6dd8 214 int l, id, oid;
5ba25331 215 unsigned long bm;
1da177e4
LT
216
217 id = *starting_id;
7aae6dd8 218 restart:
1da177e4
LT
219 p = idp->top;
220 l = idp->layers;
221 pa[l--] = NULL;
222 while (1) {
223 /*
224 * We run around this while until we reach the leaf node...
225 */
226 n = (id >> (IDR_BITS*l)) & IDR_MASK;
227 bm = ~p->bitmap;
228 m = find_next_bit(&bm, IDR_SIZE, n);
229 if (m == IDR_SIZE) {
230 /* no space available go back to previous layer. */
231 l++;
7aae6dd8 232 oid = id;
e15ae2dd 233 id = (id | ((1 << (IDR_BITS * l)) - 1)) + 1;
7aae6dd8
TH
234
235 /* if already at the top layer, we need to grow */
d2e7276b 236 if (id >= 1 << (idp->layers * IDR_BITS)) {
1da177e4 237 *starting_id = id;
12d1b439 238 return -EAGAIN;
1da177e4 239 }
d2e7276b
TH
240 p = pa[l];
241 BUG_ON(!p);
7aae6dd8
TH
242
243 /* If we need to go up one layer, continue the
244 * loop; otherwise, restart from the top.
245 */
246 sh = IDR_BITS * (l + 1);
247 if (oid >> sh == id >> sh)
248 continue;
249 else
250 goto restart;
1da177e4
LT
251 }
252 if (m != n) {
253 sh = IDR_BITS*l;
254 id = ((id >> sh) ^ n ^ m) << sh;
255 }
125c4c70 256 if ((id >= MAX_IDR_BIT) || (id < 0))
12d1b439 257 return -ENOSPC;
1da177e4
LT
258 if (l == 0)
259 break;
260 /*
261 * Create the layer below if it is missing.
262 */
263 if (!p->ary[m]) {
d5c7409f 264 new = idr_layer_alloc(gfp_mask, layer_idr);
4ae53789 265 if (!new)
12d1b439 266 return -ENOMEM;
6ff2d39b 267 new->layer = l-1;
3219b3b7 268 rcu_assign_pointer(p->ary[m], new);
1da177e4
LT
269 p->count++;
270 }
271 pa[l--] = p;
272 p = p->ary[m];
273 }
e33ac8bd
TH
274
275 pa[l] = p;
276 return id;
1da177e4
LT
277}
278
e33ac8bd 279static int idr_get_empty_slot(struct idr *idp, int starting_id,
d5c7409f
TH
280 struct idr_layer **pa, gfp_t gfp_mask,
281 struct idr *layer_idr)
1da177e4
LT
282{
283 struct idr_layer *p, *new;
284 int layers, v, id;
c259cc28 285 unsigned long flags;
e15ae2dd 286
1da177e4
LT
287 id = starting_id;
288build_up:
289 p = idp->top;
290 layers = idp->layers;
291 if (unlikely(!p)) {
d5c7409f 292 if (!(p = idr_layer_alloc(gfp_mask, layer_idr)))
12d1b439 293 return -ENOMEM;
6ff2d39b 294 p->layer = 0;
1da177e4
LT
295 layers = 1;
296 }
297 /*
298 * Add a new layer to the top of the tree if the requested
299 * id is larger than the currently allocated space.
300 */
326cf0f0 301 while (id > idr_max(layers)) {
1da177e4 302 layers++;
711a49a0
MS
303 if (!p->count) {
304 /* special case: if the tree is currently empty,
305 * then we grow the tree by moving the top node
306 * upwards.
307 */
308 p->layer++;
1da177e4 309 continue;
711a49a0 310 }
d5c7409f 311 if (!(new = idr_layer_alloc(gfp_mask, layer_idr))) {
1da177e4
LT
312 /*
313 * The allocation failed. If we built part of
314 * the structure tear it down.
315 */
c259cc28 316 spin_lock_irqsave(&idp->lock, flags);
1da177e4
LT
317 for (new = p; p && p != idp->top; new = p) {
318 p = p->ary[0];
319 new->ary[0] = NULL;
320 new->bitmap = new->count = 0;
4ae53789 321 __move_to_free_list(idp, new);
1da177e4 322 }
c259cc28 323 spin_unlock_irqrestore(&idp->lock, flags);
12d1b439 324 return -ENOMEM;
1da177e4
LT
325 }
326 new->ary[0] = p;
327 new->count = 1;
6ff2d39b 328 new->layer = layers-1;
1da177e4
LT
329 if (p->bitmap == IDR_FULL)
330 __set_bit(0, &new->bitmap);
331 p = new;
332 }
3219b3b7 333 rcu_assign_pointer(idp->top, p);
1da177e4 334 idp->layers = layers;
d5c7409f 335 v = sub_alloc(idp, &id, pa, gfp_mask, layer_idr);
12d1b439 336 if (v == -EAGAIN)
1da177e4
LT
337 goto build_up;
338 return(v);
339}
340
3594eb28
TH
341/*
342 * @id and @pa are from a successful allocation from idr_get_empty_slot().
343 * Install the user pointer @ptr and mark the slot full.
344 */
345static void idr_fill_slot(void *ptr, int id, struct idr_layer **pa)
e33ac8bd 346{
3594eb28
TH
347 rcu_assign_pointer(pa[0]->ary[id & IDR_MASK], (struct idr_layer *)ptr);
348 pa[0]->count++;
349 idr_mark_full(pa, id);
e33ac8bd
TH
350}
351
1da177e4 352/**
7c657f2f 353 * idr_get_new_above - allocate new idr entry above or equal to a start id
1da177e4 354 * @idp: idr handle
94e2bd68 355 * @ptr: pointer you want associated with the id
ea24ea85 356 * @starting_id: id to start search at
1da177e4
LT
357 * @id: pointer to the allocated handle
358 *
359 * This is the allocate id function. It should be called with any
360 * required locks.
361 *
066a9be6 362 * If allocation from IDR's private freelist fails, idr_get_new_above() will
56083ab1 363 * return %-EAGAIN. The caller should retry the idr_pre_get() call to refill
066a9be6
NA
364 * IDR's preallocation and then retry the idr_get_new_above() call.
365 *
56083ab1 366 * If the idr is full idr_get_new_above() will return %-ENOSPC.
1da177e4 367 *
56083ab1 368 * @id returns a value in the range @starting_id ... %0x7fffffff
1da177e4
LT
369 */
370int idr_get_new_above(struct idr *idp, void *ptr, int starting_id, int *id)
371{
326cf0f0 372 struct idr_layer *pa[MAX_IDR_LEVEL + 1];
1da177e4 373 int rv;
e15ae2dd 374
d5c7409f 375 rv = idr_get_empty_slot(idp, starting_id, pa, 0, idp);
944ca05c 376 if (rv < 0)
12d1b439 377 return rv == -ENOMEM ? -EAGAIN : rv;
3594eb28
TH
378
379 idr_fill_slot(ptr, rv, pa);
1da177e4
LT
380 *id = rv;
381 return 0;
382}
383EXPORT_SYMBOL(idr_get_new_above);
384
d5c7409f
TH
385/**
386 * idr_preload - preload for idr_alloc()
387 * @gfp_mask: allocation mask to use for preloading
388 *
389 * Preload per-cpu layer buffer for idr_alloc(). Can only be used from
390 * process context and each idr_preload() invocation should be matched with
391 * idr_preload_end(). Note that preemption is disabled while preloaded.
392 *
393 * The first idr_alloc() in the preloaded section can be treated as if it
394 * were invoked with @gfp_mask used for preloading. This allows using more
395 * permissive allocation masks for idrs protected by spinlocks.
396 *
397 * For example, if idr_alloc() below fails, the failure can be treated as
398 * if idr_alloc() were called with GFP_KERNEL rather than GFP_NOWAIT.
399 *
400 * idr_preload(GFP_KERNEL);
401 * spin_lock(lock);
402 *
403 * id = idr_alloc(idr, ptr, start, end, GFP_NOWAIT);
404 *
405 * spin_unlock(lock);
406 * idr_preload_end();
407 * if (id < 0)
408 * error;
409 */
410void idr_preload(gfp_t gfp_mask)
411{
412 /*
413 * Consuming preload buffer from non-process context breaks preload
414 * allocation guarantee. Disallow usage from those contexts.
415 */
416 WARN_ON_ONCE(in_interrupt());
417 might_sleep_if(gfp_mask & __GFP_WAIT);
418
419 preempt_disable();
420
421 /*
422 * idr_alloc() is likely to succeed w/o full idr_layer buffer and
423 * return value from idr_alloc() needs to be checked for failure
424 * anyway. Silently give up if allocation fails. The caller can
425 * treat failures from idr_alloc() as if idr_alloc() were called
426 * with @gfp_mask which should be enough.
427 */
428 while (__this_cpu_read(idr_preload_cnt) < MAX_IDR_FREE) {
429 struct idr_layer *new;
430
431 preempt_enable();
432 new = kmem_cache_zalloc(idr_layer_cache, gfp_mask);
433 preempt_disable();
434 if (!new)
435 break;
436
437 /* link the new one to per-cpu preload list */
438 new->ary[0] = __this_cpu_read(idr_preload_head);
439 __this_cpu_write(idr_preload_head, new);
440 __this_cpu_inc(idr_preload_cnt);
441 }
442}
443EXPORT_SYMBOL(idr_preload);
444
445/**
446 * idr_alloc - allocate new idr entry
447 * @idr: the (initialized) idr
448 * @ptr: pointer to be associated with the new id
449 * @start: the minimum id (inclusive)
450 * @end: the maximum id (exclusive, <= 0 for max)
451 * @gfp_mask: memory allocation flags
452 *
453 * Allocate an id in [start, end) and associate it with @ptr. If no ID is
454 * available in the specified range, returns -ENOSPC. On memory allocation
455 * failure, returns -ENOMEM.
456 *
457 * Note that @end is treated as max when <= 0. This is to always allow
458 * using @start + N as @end as long as N is inside integer range.
459 *
460 * The user is responsible for exclusively synchronizing all operations
461 * which may modify @idr. However, read-only accesses such as idr_find()
462 * or iteration can be performed under RCU read lock provided the user
463 * destroys @ptr in RCU-safe way after removal from idr.
464 */
465int idr_alloc(struct idr *idr, void *ptr, int start, int end, gfp_t gfp_mask)
466{
467 int max = end > 0 ? end - 1 : INT_MAX; /* inclusive upper limit */
326cf0f0 468 struct idr_layer *pa[MAX_IDR_LEVEL + 1];
d5c7409f
TH
469 int id;
470
471 might_sleep_if(gfp_mask & __GFP_WAIT);
472
473 /* sanity checks */
474 if (WARN_ON_ONCE(start < 0))
475 return -EINVAL;
476 if (unlikely(max < start))
477 return -ENOSPC;
478
479 /* allocate id */
480 id = idr_get_empty_slot(idr, start, pa, gfp_mask, NULL);
481 if (unlikely(id < 0))
482 return id;
483 if (unlikely(id > max))
484 return -ENOSPC;
485
486 idr_fill_slot(ptr, id, pa);
487 return id;
488}
489EXPORT_SYMBOL_GPL(idr_alloc);
490
1da177e4
LT
491static void idr_remove_warning(int id)
492{
f098ad65
ND
493 printk(KERN_WARNING
494 "idr_remove called for id=%d which is not allocated.\n", id);
1da177e4
LT
495 dump_stack();
496}
497
498static void sub_remove(struct idr *idp, int shift, int id)
499{
500 struct idr_layer *p = idp->top;
326cf0f0 501 struct idr_layer **pa[MAX_IDR_LEVEL + 1];
1da177e4 502 struct idr_layer ***paa = &pa[0];
cf481c20 503 struct idr_layer *to_free;
1da177e4
LT
504 int n;
505
506 *paa = NULL;
507 *++paa = &idp->top;
508
509 while ((shift > 0) && p) {
510 n = (id >> shift) & IDR_MASK;
511 __clear_bit(n, &p->bitmap);
512 *++paa = &p->ary[n];
513 p = p->ary[n];
514 shift -= IDR_BITS;
515 }
516 n = id & IDR_MASK;
517 if (likely(p != NULL && test_bit(n, &p->bitmap))){
518 __clear_bit(n, &p->bitmap);
cf481c20
ND
519 rcu_assign_pointer(p->ary[n], NULL);
520 to_free = NULL;
1da177e4 521 while(*paa && ! --((**paa)->count)){
cf481c20
ND
522 if (to_free)
523 free_layer(to_free);
524 to_free = **paa;
1da177e4
LT
525 **paa-- = NULL;
526 }
e15ae2dd 527 if (!*paa)
1da177e4 528 idp->layers = 0;
cf481c20
ND
529 if (to_free)
530 free_layer(to_free);
e15ae2dd 531 } else
1da177e4 532 idr_remove_warning(id);
1da177e4
LT
533}
534
535/**
56083ab1 536 * idr_remove - remove the given id and free its slot
72fd4a35
RD
537 * @idp: idr handle
538 * @id: unique key
1da177e4
LT
539 */
540void idr_remove(struct idr *idp, int id)
541{
542 struct idr_layer *p;
cf481c20 543 struct idr_layer *to_free;
1da177e4
LT
544
545 /* Mask off upper bits we don't use for the search. */
125c4c70 546 id &= MAX_IDR_MASK;
1da177e4
LT
547
548 sub_remove(idp, (idp->layers - 1) * IDR_BITS, id);
e15ae2dd 549 if (idp->top && idp->top->count == 1 && (idp->layers > 1) &&
cf481c20
ND
550 idp->top->ary[0]) {
551 /*
552 * Single child at leftmost slot: we can shrink the tree.
553 * This level is not needed anymore since when layers are
554 * inserted, they are inserted at the top of the existing
555 * tree.
556 */
557 to_free = idp->top;
1da177e4 558 p = idp->top->ary[0];
cf481c20 559 rcu_assign_pointer(idp->top, p);
1da177e4 560 --idp->layers;
cf481c20
ND
561 to_free->bitmap = to_free->count = 0;
562 free_layer(to_free);
1da177e4 563 }
125c4c70 564 while (idp->id_free_cnt >= MAX_IDR_FREE) {
4ae53789 565 p = get_from_free_list(idp);
cf481c20
ND
566 /*
567 * Note: we don't call the rcu callback here, since the only
568 * layers that fall into the freelist are those that have been
569 * preallocated.
570 */
1da177e4 571 kmem_cache_free(idr_layer_cache, p);
1da177e4 572 }
af8e2a4c 573 return;
1da177e4
LT
574}
575EXPORT_SYMBOL(idr_remove);
576
fe6e24ec 577void __idr_remove_all(struct idr *idp)
23936cc0 578{
6ace06dc 579 int n, id, max;
2dcb22b3 580 int bt_mask;
23936cc0 581 struct idr_layer *p;
326cf0f0 582 struct idr_layer *pa[MAX_IDR_LEVEL + 1];
23936cc0
KH
583 struct idr_layer **paa = &pa[0];
584
585 n = idp->layers * IDR_BITS;
586 p = idp->top;
1b23336a 587 rcu_assign_pointer(idp->top, NULL);
326cf0f0 588 max = idr_max(idp->layers);
23936cc0
KH
589
590 id = 0;
326cf0f0 591 while (id >= 0 && id <= max) {
23936cc0
KH
592 while (n > IDR_BITS && p) {
593 n -= IDR_BITS;
594 *paa++ = p;
595 p = p->ary[(id >> n) & IDR_MASK];
596 }
597
2dcb22b3 598 bt_mask = id;
23936cc0 599 id += 1 << n;
2dcb22b3
ID
600 /* Get the highest bit that the above add changed from 0->1. */
601 while (n < fls(id ^ bt_mask)) {
cf481c20
ND
602 if (p)
603 free_layer(p);
23936cc0
KH
604 n += IDR_BITS;
605 p = *--paa;
606 }
607 }
23936cc0
KH
608 idp->layers = 0;
609}
fe6e24ec 610EXPORT_SYMBOL(__idr_remove_all);
23936cc0 611
8d3b3591
AM
612/**
613 * idr_destroy - release all cached layers within an idr tree
ea24ea85 614 * @idp: idr handle
9bb26bc1
TH
615 *
616 * Free all id mappings and all idp_layers. After this function, @idp is
617 * completely unused and can be freed / recycled. The caller is
618 * responsible for ensuring that no one else accesses @idp during or after
619 * idr_destroy().
620 *
621 * A typical clean-up sequence for objects stored in an idr tree will use
622 * idr_for_each() to free all objects, if necessay, then idr_destroy() to
623 * free up the id mappings and cached idr_layers.
8d3b3591
AM
624 */
625void idr_destroy(struct idr *idp)
626{
fe6e24ec 627 __idr_remove_all(idp);
9bb26bc1 628
8d3b3591 629 while (idp->id_free_cnt) {
4ae53789 630 struct idr_layer *p = get_from_free_list(idp);
8d3b3591
AM
631 kmem_cache_free(idr_layer_cache, p);
632 }
633}
634EXPORT_SYMBOL(idr_destroy);
635
1da177e4
LT
636/**
637 * idr_find - return pointer for given id
638 * @idp: idr handle
639 * @id: lookup key
640 *
641 * Return the pointer given the id it has been registered with. A %NULL
642 * return indicates that @id is not valid or you passed %NULL in
643 * idr_get_new().
644 *
f9c46d6e
ND
645 * This function can be called under rcu_read_lock(), given that the leaf
646 * pointers lifetimes are correctly managed.
1da177e4
LT
647 */
648void *idr_find(struct idr *idp, int id)
649{
650 int n;
651 struct idr_layer *p;
652
96be753a 653 p = rcu_dereference_raw(idp->top);
6ff2d39b
MS
654 if (!p)
655 return NULL;
656 n = (p->layer+1) * IDR_BITS;
1da177e4
LT
657
658 /* Mask off upper bits we don't use for the search. */
125c4c70 659 id &= MAX_IDR_MASK;
1da177e4 660
326cf0f0 661 if (id > idr_max(p->layer + 1))
1da177e4 662 return NULL;
6ff2d39b 663 BUG_ON(n == 0);
1da177e4
LT
664
665 while (n > 0 && p) {
666 n -= IDR_BITS;
6ff2d39b 667 BUG_ON(n != p->layer*IDR_BITS);
96be753a 668 p = rcu_dereference_raw(p->ary[(id >> n) & IDR_MASK]);
1da177e4
LT
669 }
670 return((void *)p);
671}
672EXPORT_SYMBOL(idr_find);
673
96d7fa42
KH
674/**
675 * idr_for_each - iterate through all stored pointers
676 * @idp: idr handle
677 * @fn: function to be called for each pointer
678 * @data: data passed back to callback function
679 *
680 * Iterate over the pointers registered with the given idr. The
681 * callback function will be called for each pointer currently
682 * registered, passing the id, the pointer and the data pointer passed
683 * to this function. It is not safe to modify the idr tree while in
684 * the callback, so functions such as idr_get_new and idr_remove are
685 * not allowed.
686 *
687 * We check the return of @fn each time. If it returns anything other
56083ab1 688 * than %0, we break out and return that value.
96d7fa42
KH
689 *
690 * The caller must serialize idr_for_each() vs idr_get_new() and idr_remove().
691 */
692int idr_for_each(struct idr *idp,
693 int (*fn)(int id, void *p, void *data), void *data)
694{
695 int n, id, max, error = 0;
696 struct idr_layer *p;
326cf0f0 697 struct idr_layer *pa[MAX_IDR_LEVEL + 1];
96d7fa42
KH
698 struct idr_layer **paa = &pa[0];
699
700 n = idp->layers * IDR_BITS;
96be753a 701 p = rcu_dereference_raw(idp->top);
326cf0f0 702 max = idr_max(idp->layers);
96d7fa42
KH
703
704 id = 0;
326cf0f0 705 while (id >= 0 && id <= max) {
96d7fa42
KH
706 while (n > 0 && p) {
707 n -= IDR_BITS;
708 *paa++ = p;
96be753a 709 p = rcu_dereference_raw(p->ary[(id >> n) & IDR_MASK]);
96d7fa42
KH
710 }
711
712 if (p) {
713 error = fn(id, (void *)p, data);
714 if (error)
715 break;
716 }
717
718 id += 1 << n;
719 while (n < fls(id)) {
720 n += IDR_BITS;
721 p = *--paa;
722 }
723 }
724
725 return error;
726}
727EXPORT_SYMBOL(idr_for_each);
728
38460b48
KH
729/**
730 * idr_get_next - lookup next object of id to given id.
731 * @idp: idr handle
ea24ea85 732 * @nextidp: pointer to lookup key
38460b48
KH
733 *
734 * Returns pointer to registered object with id, which is next number to
1458ce16
NA
735 * given id. After being looked up, *@nextidp will be updated for the next
736 * iteration.
9f7de827
HD
737 *
738 * This function can be called under rcu_read_lock(), given that the leaf
739 * pointers lifetimes are correctly managed.
38460b48 740 */
38460b48
KH
741void *idr_get_next(struct idr *idp, int *nextidp)
742{
326cf0f0 743 struct idr_layer *p, *pa[MAX_IDR_LEVEL + 1];
38460b48
KH
744 struct idr_layer **paa = &pa[0];
745 int id = *nextidp;
746 int n, max;
747
748 /* find first ent */
94bfa3b6 749 p = rcu_dereference_raw(idp->top);
38460b48
KH
750 if (!p)
751 return NULL;
9f7de827 752 n = (p->layer + 1) * IDR_BITS;
326cf0f0 753 max = idr_max(p->layer + 1);
38460b48 754
326cf0f0 755 while (id >= 0 && id <= max) {
38460b48
KH
756 while (n > 0 && p) {
757 n -= IDR_BITS;
758 *paa++ = p;
94bfa3b6 759 p = rcu_dereference_raw(p->ary[(id >> n) & IDR_MASK]);
38460b48
KH
760 }
761
762 if (p) {
763 *nextidp = id;
764 return p;
765 }
766
6cdae741
TH
767 /*
768 * Proceed to the next layer at the current level. Unlike
769 * idr_for_each(), @id isn't guaranteed to be aligned to
770 * layer boundary at this point and adding 1 << n may
771 * incorrectly skip IDs. Make sure we jump to the
772 * beginning of the next layer using round_up().
773 */
774 id = round_up(id + 1, 1 << n);
38460b48
KH
775 while (n < fls(id)) {
776 n += IDR_BITS;
777 p = *--paa;
778 }
779 }
780 return NULL;
781}
4d1ee80f 782EXPORT_SYMBOL(idr_get_next);
38460b48
KH
783
784
5806f07c
JM
785/**
786 * idr_replace - replace pointer for given id
787 * @idp: idr handle
788 * @ptr: pointer you want associated with the id
789 * @id: lookup key
790 *
791 * Replace the pointer registered with an id and return the old value.
56083ab1
RD
792 * A %-ENOENT return indicates that @id was not found.
793 * A %-EINVAL return indicates that @id was not within valid constraints.
5806f07c 794 *
cf481c20 795 * The caller must serialize with writers.
5806f07c
JM
796 */
797void *idr_replace(struct idr *idp, void *ptr, int id)
798{
799 int n;
800 struct idr_layer *p, *old_p;
801
5806f07c 802 p = idp->top;
6ff2d39b
MS
803 if (!p)
804 return ERR_PTR(-EINVAL);
805
806 n = (p->layer+1) * IDR_BITS;
5806f07c 807
125c4c70 808 id &= MAX_IDR_MASK;
5806f07c
JM
809
810 if (id >= (1 << n))
811 return ERR_PTR(-EINVAL);
812
813 n -= IDR_BITS;
814 while ((n > 0) && p) {
815 p = p->ary[(id >> n) & IDR_MASK];
816 n -= IDR_BITS;
817 }
818
819 n = id & IDR_MASK;
820 if (unlikely(p == NULL || !test_bit(n, &p->bitmap)))
821 return ERR_PTR(-ENOENT);
822
823 old_p = p->ary[n];
cf481c20 824 rcu_assign_pointer(p->ary[n], ptr);
5806f07c
JM
825
826 return old_p;
827}
828EXPORT_SYMBOL(idr_replace);
829
199f0ca5 830void __init idr_init_cache(void)
1da177e4 831{
199f0ca5 832 idr_layer_cache = kmem_cache_create("idr_layer_cache",
5b019e99 833 sizeof(struct idr_layer), 0, SLAB_PANIC, NULL);
1da177e4
LT
834}
835
836/**
837 * idr_init - initialize idr handle
838 * @idp: idr handle
839 *
840 * This function is use to set up the handle (@idp) that you will pass
841 * to the rest of the functions.
842 */
843void idr_init(struct idr *idp)
844{
1da177e4
LT
845 memset(idp, 0, sizeof(struct idr));
846 spin_lock_init(&idp->lock);
847}
848EXPORT_SYMBOL(idr_init);
72dba584
TH
849
850
56083ab1
RD
/**
 * DOC: IDA description
 * IDA - IDR based ID allocator
 *
 * This is an id allocator without id -> pointer translation.  Memory
 * usage is much lower than a full blown idr because each id only
 * occupies a bit.  ida uses a custom leaf node which contains
 * IDA_BITMAP_BITS slots.
 *
 * 2007-04-25  written by Tejun Heo <htejun@gmail.com>
 */
862
863static void free_bitmap(struct ida *ida, struct ida_bitmap *bitmap)
864{
865 unsigned long flags;
866
867 if (!ida->free_bitmap) {
868 spin_lock_irqsave(&ida->idr.lock, flags);
869 if (!ida->free_bitmap) {
870 ida->free_bitmap = bitmap;
871 bitmap = NULL;
872 }
873 spin_unlock_irqrestore(&ida->idr.lock, flags);
874 }
875
876 kfree(bitmap);
877}
878
879/**
880 * ida_pre_get - reserve resources for ida allocation
881 * @ida: ida handle
882 * @gfp_mask: memory allocation flag
883 *
884 * This function should be called prior to locking and calling the
885 * following function. It preallocates enough memory to satisfy the
886 * worst possible allocation.
887 *
56083ab1
RD
888 * If the system is REALLY out of memory this function returns %0,
889 * otherwise %1.
72dba584
TH
890 */
891int ida_pre_get(struct ida *ida, gfp_t gfp_mask)
892{
893 /* allocate idr_layers */
894 if (!idr_pre_get(&ida->idr, gfp_mask))
895 return 0;
896
897 /* allocate free_bitmap */
898 if (!ida->free_bitmap) {
899 struct ida_bitmap *bitmap;
900
901 bitmap = kmalloc(sizeof(struct ida_bitmap), gfp_mask);
902 if (!bitmap)
903 return 0;
904
905 free_bitmap(ida, bitmap);
906 }
907
908 return 1;
909}
910EXPORT_SYMBOL(ida_pre_get);
911
912/**
913 * ida_get_new_above - allocate new ID above or equal to a start id
914 * @ida: ida handle
ea24ea85 915 * @starting_id: id to start search at
72dba584
TH
916 * @p_id: pointer to the allocated handle
917 *
e3816c54
WSH
918 * Allocate new ID above or equal to @starting_id. It should be called
919 * with any required locks.
72dba584 920 *
56083ab1 921 * If memory is required, it will return %-EAGAIN, you should unlock
72dba584 922 * and go back to the ida_pre_get() call. If the ida is full, it will
56083ab1 923 * return %-ENOSPC.
72dba584 924 *
56083ab1 925 * @p_id returns a value in the range @starting_id ... %0x7fffffff.
72dba584
TH
926 */
927int ida_get_new_above(struct ida *ida, int starting_id, int *p_id)
928{
326cf0f0 929 struct idr_layer *pa[MAX_IDR_LEVEL + 1];
72dba584
TH
930 struct ida_bitmap *bitmap;
931 unsigned long flags;
932 int idr_id = starting_id / IDA_BITMAP_BITS;
933 int offset = starting_id % IDA_BITMAP_BITS;
934 int t, id;
935
936 restart:
937 /* get vacant slot */
d5c7409f 938 t = idr_get_empty_slot(&ida->idr, idr_id, pa, 0, &ida->idr);
944ca05c 939 if (t < 0)
12d1b439 940 return t == -ENOMEM ? -EAGAIN : t;
72dba584 941
125c4c70 942 if (t * IDA_BITMAP_BITS >= MAX_IDR_BIT)
72dba584
TH
943 return -ENOSPC;
944
945 if (t != idr_id)
946 offset = 0;
947 idr_id = t;
948
949 /* if bitmap isn't there, create a new one */
950 bitmap = (void *)pa[0]->ary[idr_id & IDR_MASK];
951 if (!bitmap) {
952 spin_lock_irqsave(&ida->idr.lock, flags);
953 bitmap = ida->free_bitmap;
954 ida->free_bitmap = NULL;
955 spin_unlock_irqrestore(&ida->idr.lock, flags);
956
957 if (!bitmap)
958 return -EAGAIN;
959
960 memset(bitmap, 0, sizeof(struct ida_bitmap));
3219b3b7
ND
961 rcu_assign_pointer(pa[0]->ary[idr_id & IDR_MASK],
962 (void *)bitmap);
72dba584
TH
963 pa[0]->count++;
964 }
965
966 /* lookup for empty slot */
967 t = find_next_zero_bit(bitmap->bitmap, IDA_BITMAP_BITS, offset);
968 if (t == IDA_BITMAP_BITS) {
969 /* no empty slot after offset, continue to the next chunk */
970 idr_id++;
971 offset = 0;
972 goto restart;
973 }
974
975 id = idr_id * IDA_BITMAP_BITS + t;
125c4c70 976 if (id >= MAX_IDR_BIT)
72dba584
TH
977 return -ENOSPC;
978
979 __set_bit(t, bitmap->bitmap);
980 if (++bitmap->nr_busy == IDA_BITMAP_BITS)
981 idr_mark_full(pa, idr_id);
982
983 *p_id = id;
984
985 /* Each leaf node can handle nearly a thousand slots and the
986 * whole idea of ida is to have small memory foot print.
987 * Throw away extra resources one by one after each successful
988 * allocation.
989 */
990 if (ida->idr.id_free_cnt || ida->free_bitmap) {
4ae53789 991 struct idr_layer *p = get_from_free_list(&ida->idr);
72dba584
TH
992 if (p)
993 kmem_cache_free(idr_layer_cache, p);
994 }
995
996 return 0;
997}
998EXPORT_SYMBOL(ida_get_new_above);
999
72dba584
TH
1000/**
1001 * ida_remove - remove the given ID
1002 * @ida: ida handle
1003 * @id: ID to free
1004 */
1005void ida_remove(struct ida *ida, int id)
1006{
1007 struct idr_layer *p = ida->idr.top;
1008 int shift = (ida->idr.layers - 1) * IDR_BITS;
1009 int idr_id = id / IDA_BITMAP_BITS;
1010 int offset = id % IDA_BITMAP_BITS;
1011 int n;
1012 struct ida_bitmap *bitmap;
1013
1014 /* clear full bits while looking up the leaf idr_layer */
1015 while ((shift > 0) && p) {
1016 n = (idr_id >> shift) & IDR_MASK;
1017 __clear_bit(n, &p->bitmap);
1018 p = p->ary[n];
1019 shift -= IDR_BITS;
1020 }
1021
1022 if (p == NULL)
1023 goto err;
1024
1025 n = idr_id & IDR_MASK;
1026 __clear_bit(n, &p->bitmap);
1027
1028 bitmap = (void *)p->ary[n];
1029 if (!test_bit(offset, bitmap->bitmap))
1030 goto err;
1031
1032 /* update bitmap and remove it if empty */
1033 __clear_bit(offset, bitmap->bitmap);
1034 if (--bitmap->nr_busy == 0) {
1035 __set_bit(n, &p->bitmap); /* to please idr_remove() */
1036 idr_remove(&ida->idr, idr_id);
1037 free_bitmap(ida, bitmap);
1038 }
1039
1040 return;
1041
1042 err:
1043 printk(KERN_WARNING
1044 "ida_remove called for id=%d which is not allocated.\n", id);
1045}
1046EXPORT_SYMBOL(ida_remove);
1047
1048/**
1049 * ida_destroy - release all cached layers within an ida tree
ea24ea85 1050 * @ida: ida handle
72dba584
TH
1051 */
1052void ida_destroy(struct ida *ida)
1053{
1054 idr_destroy(&ida->idr);
1055 kfree(ida->free_bitmap);
1056}
1057EXPORT_SYMBOL(ida_destroy);
1058
88eca020
RR
1059/**
1060 * ida_simple_get - get a new id.
1061 * @ida: the (initialized) ida.
1062 * @start: the minimum id (inclusive, < 0x8000000)
1063 * @end: the maximum id (exclusive, < 0x8000000 or 0)
1064 * @gfp_mask: memory allocation flags
1065 *
1066 * Allocates an id in the range start <= id < end, or returns -ENOSPC.
1067 * On memory allocation failure, returns -ENOMEM.
1068 *
1069 * Use ida_simple_remove() to get rid of an id.
1070 */
1071int ida_simple_get(struct ida *ida, unsigned int start, unsigned int end,
1072 gfp_t gfp_mask)
1073{
1074 int ret, id;
1075 unsigned int max;
46cbc1d3 1076 unsigned long flags;
88eca020
RR
1077
1078 BUG_ON((int)start < 0);
1079 BUG_ON((int)end < 0);
1080
1081 if (end == 0)
1082 max = 0x80000000;
1083 else {
1084 BUG_ON(end < start);
1085 max = end - 1;
1086 }
1087
1088again:
1089 if (!ida_pre_get(ida, gfp_mask))
1090 return -ENOMEM;
1091
46cbc1d3 1092 spin_lock_irqsave(&simple_ida_lock, flags);
88eca020
RR
1093 ret = ida_get_new_above(ida, start, &id);
1094 if (!ret) {
1095 if (id > max) {
1096 ida_remove(ida, id);
1097 ret = -ENOSPC;
1098 } else {
1099 ret = id;
1100 }
1101 }
46cbc1d3 1102 spin_unlock_irqrestore(&simple_ida_lock, flags);
88eca020
RR
1103
1104 if (unlikely(ret == -EAGAIN))
1105 goto again;
1106
1107 return ret;
1108}
1109EXPORT_SYMBOL(ida_simple_get);
1110
1111/**
1112 * ida_simple_remove - remove an allocated id.
1113 * @ida: the (initialized) ida.
1114 * @id: the id returned by ida_simple_get.
1115 */
1116void ida_simple_remove(struct ida *ida, unsigned int id)
1117{
46cbc1d3
TH
1118 unsigned long flags;
1119
88eca020 1120 BUG_ON((int)id < 0);
46cbc1d3 1121 spin_lock_irqsave(&simple_ida_lock, flags);
88eca020 1122 ida_remove(ida, id);
46cbc1d3 1123 spin_unlock_irqrestore(&simple_ida_lock, flags);
88eca020
RR
1124}
1125EXPORT_SYMBOL(ida_simple_remove);
1126
72dba584
TH
1127/**
1128 * ida_init - initialize ida handle
1129 * @ida: ida handle
1130 *
1131 * This function is use to set up the handle (@ida) that you will pass
1132 * to the rest of the functions.
1133 */
1134void ida_init(struct ida *ida)
1135{
1136 memset(ida, 0, sizeof(struct ida));
1137 idr_init(&ida->idr);
1138
1139}
1140EXPORT_SYMBOL(ida_init);