// SPDX-License-Identifier: GPL-2.0-only
/*
 * Copyright (C) 2012 Red Hat, Inc.
 *
 * This file is released under the GPL.
 */
9 #include "dm-bio-prison-v1.h"
10 #include "dm-bio-prison-v2.h"
12 #include <linux/spinlock.h>
13 #include <linux/mempool.h>
14 #include <linux/module.h>
15 #include <linux/slab.h>
/*----------------------------------------------------------------*/

/* Minimum element count handed to mempool_init_slab_pool() for each prison. */
#define MIN_CELLS 1024
21 struct prison_region {
24 } ____cacheline_aligned_in_smp;
26 struct dm_bio_prison {
28 unsigned int num_locks;
29 struct prison_region regions[];
/*
 * Slab cache that every prison's cell mempool draws from.  Created in
 * dm_bio_prison_init_v1() and destroyed in dm_bio_prison_exit_v1().
 */
static struct kmem_cache *_cell_cache;

/*----------------------------------------------------------------*/
37 * @nr_cells should be the number of cells you want in use _concurrently_.
38 * Don't confuse it with the number of distinct keys.
40 struct dm_bio_prison *dm_bio_prison_create(void)
43 unsigned int i, num_locks;
44 struct dm_bio_prison *prison;
46 num_locks = dm_num_hash_locks();
47 prison = kzalloc(struct_size(prison, regions, num_locks), GFP_KERNEL);
50 prison->num_locks = num_locks;
52 for (i = 0; i < prison->num_locks; i++) {
53 spin_lock_init(&prison->regions[i].lock);
54 prison->regions[i].cell = RB_ROOT;
57 ret = mempool_init_slab_pool(&prison->cell_pool, MIN_CELLS, _cell_cache);
65 EXPORT_SYMBOL_GPL(dm_bio_prison_create);
67 void dm_bio_prison_destroy(struct dm_bio_prison *prison)
69 mempool_exit(&prison->cell_pool);
72 EXPORT_SYMBOL_GPL(dm_bio_prison_destroy);
74 struct dm_bio_prison_cell *dm_bio_prison_alloc_cell(struct dm_bio_prison *prison, gfp_t gfp)
76 return mempool_alloc(&prison->cell_pool, gfp);
78 EXPORT_SYMBOL_GPL(dm_bio_prison_alloc_cell);
80 void dm_bio_prison_free_cell(struct dm_bio_prison *prison,
81 struct dm_bio_prison_cell *cell)
83 mempool_free(cell, &prison->cell_pool);
85 EXPORT_SYMBOL_GPL(dm_bio_prison_free_cell);
87 static void __setup_new_cell(struct dm_cell_key *key,
89 struct dm_bio_prison_cell *cell)
91 memcpy(&cell->key, key, sizeof(cell->key));
92 cell->holder = holder;
93 bio_list_init(&cell->bios);
96 static int cmp_keys(struct dm_cell_key *lhs,
97 struct dm_cell_key *rhs)
99 if (lhs->virtual < rhs->virtual)
102 if (lhs->virtual > rhs->virtual)
105 if (lhs->dev < rhs->dev)
108 if (lhs->dev > rhs->dev)
111 if (lhs->block_end <= rhs->block_begin)
114 if (lhs->block_begin >= rhs->block_end)
120 static unsigned lock_nr(struct dm_cell_key *key, unsigned int num_locks)
122 return (key->block_begin >> BIO_PRISON_MAX_RANGE_SHIFT) & (num_locks - 1);
125 bool dm_cell_key_has_valid_range(struct dm_cell_key *key)
127 if (WARN_ON_ONCE(key->block_end - key->block_begin > BIO_PRISON_MAX_RANGE))
129 if (WARN_ON_ONCE((key->block_begin >> BIO_PRISON_MAX_RANGE_SHIFT) !=
130 (key->block_end - 1) >> BIO_PRISON_MAX_RANGE_SHIFT))
135 EXPORT_SYMBOL(dm_cell_key_has_valid_range);
137 static int __bio_detain(struct rb_root *root,
138 struct dm_cell_key *key,
140 struct dm_bio_prison_cell *cell_prealloc,
141 struct dm_bio_prison_cell **cell_result)
144 struct rb_node **new = &root->rb_node, *parent = NULL;
147 struct dm_bio_prison_cell *cell =
148 rb_entry(*new, struct dm_bio_prison_cell, node);
150 r = cmp_keys(key, &cell->key);
154 new = &((*new)->rb_left);
156 new = &((*new)->rb_right);
159 bio_list_add(&cell->bios, inmate);
165 __setup_new_cell(key, inmate, cell_prealloc);
166 *cell_result = cell_prealloc;
168 rb_link_node(&cell_prealloc->node, parent, new);
169 rb_insert_color(&cell_prealloc->node, root);
174 static int bio_detain(struct dm_bio_prison *prison,
175 struct dm_cell_key *key,
177 struct dm_bio_prison_cell *cell_prealloc,
178 struct dm_bio_prison_cell **cell_result)
181 unsigned l = lock_nr(key, prison->num_locks);
183 spin_lock_irq(&prison->regions[l].lock);
184 r = __bio_detain(&prison->regions[l].cell, key, inmate, cell_prealloc, cell_result);
185 spin_unlock_irq(&prison->regions[l].lock);
/*
 * Detain @inmate in the cell identified by @key.
 *
 * Returns 1 if a matching cell already existed (@inmate was queued on
 * it and @cell_prealloc is unused), or 0 if @cell_prealloc was inserted
 * as a new cell with @inmate as its holder.  *@cell_result is set to
 * the cell in either case.
 */
int dm_bio_detain(struct dm_bio_prison *prison,
		  struct dm_cell_key *key,
		  struct bio *inmate,
		  struct dm_bio_prison_cell *cell_prealloc,
		  struct dm_bio_prison_cell **cell_result)
{
	return bio_detain(prison, key, inmate, cell_prealloc, cell_result);
}
EXPORT_SYMBOL_GPL(dm_bio_detain);
200 int dm_get_cell(struct dm_bio_prison *prison,
201 struct dm_cell_key *key,
202 struct dm_bio_prison_cell *cell_prealloc,
203 struct dm_bio_prison_cell **cell_result)
205 return bio_detain(prison, key, NULL, cell_prealloc, cell_result);
207 EXPORT_SYMBOL_GPL(dm_get_cell);
210 * @inmates must have been initialised prior to this call
212 static void __cell_release(struct rb_root *root,
213 struct dm_bio_prison_cell *cell,
214 struct bio_list *inmates)
216 rb_erase(&cell->node, root);
220 bio_list_add(inmates, cell->holder);
221 bio_list_merge(inmates, &cell->bios);
225 void dm_cell_release(struct dm_bio_prison *prison,
226 struct dm_bio_prison_cell *cell,
227 struct bio_list *bios)
229 unsigned l = lock_nr(&cell->key, prison->num_locks);
231 spin_lock_irq(&prison->regions[l].lock);
232 __cell_release(&prison->regions[l].cell, cell, bios);
233 spin_unlock_irq(&prison->regions[l].lock);
235 EXPORT_SYMBOL_GPL(dm_cell_release);
238 * Sometimes we don't want the holder, just the additional bios.
240 static void __cell_release_no_holder(struct rb_root *root,
241 struct dm_bio_prison_cell *cell,
242 struct bio_list *inmates)
244 rb_erase(&cell->node, root);
245 bio_list_merge(inmates, &cell->bios);
248 void dm_cell_release_no_holder(struct dm_bio_prison *prison,
249 struct dm_bio_prison_cell *cell,
250 struct bio_list *inmates)
252 unsigned l = lock_nr(&cell->key, prison->num_locks);
255 spin_lock_irqsave(&prison->regions[l].lock, flags);
256 __cell_release_no_holder(&prison->regions[l].cell, cell, inmates);
257 spin_unlock_irqrestore(&prison->regions[l].lock, flags);
259 EXPORT_SYMBOL_GPL(dm_cell_release_no_holder);
261 void dm_cell_error(struct dm_bio_prison *prison,
262 struct dm_bio_prison_cell *cell, blk_status_t error)
264 struct bio_list bios;
267 bio_list_init(&bios);
268 dm_cell_release(prison, cell, &bios);
270 while ((bio = bio_list_pop(&bios))) {
271 bio->bi_status = error;
275 EXPORT_SYMBOL_GPL(dm_cell_error);
277 void dm_cell_visit_release(struct dm_bio_prison *prison,
278 void (*visit_fn)(void *, struct dm_bio_prison_cell *),
280 struct dm_bio_prison_cell *cell)
282 unsigned l = lock_nr(&cell->key, prison->num_locks);
283 spin_lock_irq(&prison->regions[l].lock);
284 visit_fn(context, cell);
285 rb_erase(&cell->node, &prison->regions[l].cell);
286 spin_unlock_irq(&prison->regions[l].lock);
288 EXPORT_SYMBOL_GPL(dm_cell_visit_release);
290 static int __promote_or_release(struct rb_root *root,
291 struct dm_bio_prison_cell *cell)
293 if (bio_list_empty(&cell->bios)) {
294 rb_erase(&cell->node, root);
298 cell->holder = bio_list_pop(&cell->bios);
302 int dm_cell_promote_or_release(struct dm_bio_prison *prison,
303 struct dm_bio_prison_cell *cell)
306 unsigned l = lock_nr(&cell->key, prison->num_locks);
308 spin_lock_irq(&prison->regions[l].lock);
309 r = __promote_or_release(&prison->regions[l].cell, cell);
310 spin_unlock_irq(&prison->regions[l].lock);
314 EXPORT_SYMBOL_GPL(dm_cell_promote_or_release);
/*----------------------------------------------------------------*/

/* Number of entries in a deferred set's ring (see ds_next()). */
#define DEFERRED_SET_SIZE 64
320 struct dm_deferred_entry {
321 struct dm_deferred_set *ds;
323 struct list_head work_items;
326 struct dm_deferred_set {
328 unsigned int current_entry;
329 unsigned int sweeper;
330 struct dm_deferred_entry entries[DEFERRED_SET_SIZE];
333 struct dm_deferred_set *dm_deferred_set_create(void)
336 struct dm_deferred_set *ds;
338 ds = kmalloc(sizeof(*ds), GFP_KERNEL);
342 spin_lock_init(&ds->lock);
343 ds->current_entry = 0;
345 for (i = 0; i < DEFERRED_SET_SIZE; i++) {
346 ds->entries[i].ds = ds;
347 ds->entries[i].count = 0;
348 INIT_LIST_HEAD(&ds->entries[i].work_items);
353 EXPORT_SYMBOL_GPL(dm_deferred_set_create);
/*
 * Free a set obtained from dm_deferred_set_create().  Work items still
 * queued on its entries are not touched.
 */
void dm_deferred_set_destroy(struct dm_deferred_set *ds)
{
	kfree(ds);
}
EXPORT_SYMBOL_GPL(dm_deferred_set_destroy);
361 struct dm_deferred_entry *dm_deferred_entry_inc(struct dm_deferred_set *ds)
364 struct dm_deferred_entry *entry;
366 spin_lock_irqsave(&ds->lock, flags);
367 entry = ds->entries + ds->current_entry;
369 spin_unlock_irqrestore(&ds->lock, flags);
373 EXPORT_SYMBOL_GPL(dm_deferred_entry_inc);
375 static unsigned int ds_next(unsigned int index)
377 return (index + 1) % DEFERRED_SET_SIZE;
380 static void __sweep(struct dm_deferred_set *ds, struct list_head *head)
382 while ((ds->sweeper != ds->current_entry) &&
383 !ds->entries[ds->sweeper].count) {
384 list_splice_init(&ds->entries[ds->sweeper].work_items, head);
385 ds->sweeper = ds_next(ds->sweeper);
388 if ((ds->sweeper == ds->current_entry) && !ds->entries[ds->sweeper].count)
389 list_splice_init(&ds->entries[ds->sweeper].work_items, head);
392 void dm_deferred_entry_dec(struct dm_deferred_entry *entry, struct list_head *head)
396 spin_lock_irqsave(&entry->ds->lock, flags);
397 BUG_ON(!entry->count);
399 __sweep(entry->ds, head);
400 spin_unlock_irqrestore(&entry->ds->lock, flags);
402 EXPORT_SYMBOL_GPL(dm_deferred_entry_dec);
405 * Returns 1 if deferred or 0 if no pending items to delay job.
407 int dm_deferred_set_add_work(struct dm_deferred_set *ds, struct list_head *work)
410 unsigned int next_entry;
412 spin_lock_irq(&ds->lock);
413 if ((ds->sweeper == ds->current_entry) &&
414 !ds->entries[ds->current_entry].count)
417 list_add(work, &ds->entries[ds->current_entry].work_items);
418 next_entry = ds_next(ds->current_entry);
419 if (!ds->entries[next_entry].count)
420 ds->current_entry = next_entry;
422 spin_unlock_irq(&ds->lock);
426 EXPORT_SYMBOL_GPL(dm_deferred_set_add_work);
428 /*----------------------------------------------------------------*/
430 static int __init dm_bio_prison_init_v1(void)
432 _cell_cache = KMEM_CACHE(dm_bio_prison_cell, 0);
439 static void dm_bio_prison_exit_v1(void)
441 kmem_cache_destroy(_cell_cache);
445 static int (*_inits[])(void) __initdata = {
446 dm_bio_prison_init_v1,
447 dm_bio_prison_init_v2,
450 static void (*_exits[])(void) = {
451 dm_bio_prison_exit_v1,
452 dm_bio_prison_exit_v2,
455 static int __init dm_bio_prison_init(void)
457 const int count = ARRAY_SIZE(_inits);
461 for (i = 0; i < count; i++) {
476 static void __exit dm_bio_prison_exit(void)
478 int i = ARRAY_SIZE(_exits);
487 module_init(dm_bio_prison_init);
488 module_exit(dm_bio_prison_exit);
490 MODULE_DESCRIPTION(DM_NAME " bio prison");
491 MODULE_AUTHOR("Joe Thornber <dm-devel@redhat.com>");
492 MODULE_LICENSE("GPL");