dm-bio-prison-v1.c 10 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458
  1. // SPDX-License-Identifier: GPL-2.0-only
  2. /*
  3. * Copyright (C) 2012 Red Hat, Inc.
  4. *
  5. * This file is released under the GPL.
  6. */
  7. #include "dm.h"
  8. #include "dm-bio-prison-v1.h"
  9. #include "dm-bio-prison-v2.h"
  10. #include <linux/spinlock.h>
  11. #include <linux/mempool.h>
  12. #include <linux/module.h>
  13. #include <linux/slab.h>
  14. /*----------------------------------------------------------------*/
  15. #define MIN_CELLS 1024
  16. struct prison_region {
  17. spinlock_t lock;
  18. struct rb_root cell;
  19. } ____cacheline_aligned_in_smp;
  20. struct dm_bio_prison {
  21. mempool_t cell_pool;
  22. unsigned int num_locks;
  23. struct prison_region regions[] __counted_by(num_locks);
  24. };
  25. static struct kmem_cache *_cell_cache;
  26. /*----------------------------------------------------------------*/
  27. /*
  28. * @nr_cells should be the number of cells you want in use _concurrently_.
  29. * Don't confuse it with the number of distinct keys.
  30. */
  31. struct dm_bio_prison *dm_bio_prison_create(void)
  32. {
  33. int ret;
  34. unsigned int i, num_locks;
  35. struct dm_bio_prison *prison;
  36. num_locks = dm_num_hash_locks();
  37. prison = kzalloc_flex(*prison, regions, num_locks);
  38. if (!prison)
  39. return NULL;
  40. prison->num_locks = num_locks;
  41. for (i = 0; i < prison->num_locks; i++) {
  42. spin_lock_init(&prison->regions[i].lock);
  43. prison->regions[i].cell = RB_ROOT;
  44. }
  45. ret = mempool_init_slab_pool(&prison->cell_pool, MIN_CELLS, _cell_cache);
  46. if (ret) {
  47. kfree(prison);
  48. return NULL;
  49. }
  50. return prison;
  51. }
  52. EXPORT_SYMBOL_GPL(dm_bio_prison_create);
  53. void dm_bio_prison_destroy(struct dm_bio_prison *prison)
  54. {
  55. mempool_exit(&prison->cell_pool);
  56. kfree(prison);
  57. }
  58. EXPORT_SYMBOL_GPL(dm_bio_prison_destroy);
  59. struct dm_bio_prison_cell *dm_bio_prison_alloc_cell(struct dm_bio_prison *prison, gfp_t gfp)
  60. {
  61. return mempool_alloc(&prison->cell_pool, gfp);
  62. }
  63. EXPORT_SYMBOL_GPL(dm_bio_prison_alloc_cell);
  64. void dm_bio_prison_free_cell(struct dm_bio_prison *prison,
  65. struct dm_bio_prison_cell *cell)
  66. {
  67. mempool_free(cell, &prison->cell_pool);
  68. }
  69. EXPORT_SYMBOL_GPL(dm_bio_prison_free_cell);
  70. static void __setup_new_cell(struct dm_cell_key *key,
  71. struct bio *holder,
  72. struct dm_bio_prison_cell *cell)
  73. {
  74. memcpy(&cell->key, key, sizeof(cell->key));
  75. cell->holder = holder;
  76. bio_list_init(&cell->bios);
  77. }
  78. static int cmp_keys(struct dm_cell_key *lhs,
  79. struct dm_cell_key *rhs)
  80. {
  81. if (lhs->virtual < rhs->virtual)
  82. return -1;
  83. if (lhs->virtual > rhs->virtual)
  84. return 1;
  85. if (lhs->dev < rhs->dev)
  86. return -1;
  87. if (lhs->dev > rhs->dev)
  88. return 1;
  89. if (lhs->block_end <= rhs->block_begin)
  90. return -1;
  91. if (lhs->block_begin >= rhs->block_end)
  92. return 1;
  93. return 0;
  94. }
  95. static inline unsigned int lock_nr(struct dm_cell_key *key, unsigned int num_locks)
  96. {
  97. return dm_hash_locks_index((key->block_begin >> BIO_PRISON_MAX_RANGE_SHIFT),
  98. num_locks);
  99. }
  100. bool dm_cell_key_has_valid_range(struct dm_cell_key *key)
  101. {
  102. if (WARN_ON_ONCE(key->block_end - key->block_begin > BIO_PRISON_MAX_RANGE))
  103. return false;
  104. if (WARN_ON_ONCE((key->block_begin >> BIO_PRISON_MAX_RANGE_SHIFT) !=
  105. (key->block_end - 1) >> BIO_PRISON_MAX_RANGE_SHIFT))
  106. return false;
  107. return true;
  108. }
  109. EXPORT_SYMBOL(dm_cell_key_has_valid_range);
  110. static int __bio_detain(struct rb_root *root,
  111. struct dm_cell_key *key,
  112. struct bio *inmate,
  113. struct dm_bio_prison_cell *cell_prealloc,
  114. struct dm_bio_prison_cell **cell_result)
  115. {
  116. int r;
  117. struct rb_node **new = &root->rb_node, *parent = NULL;
  118. while (*new) {
  119. struct dm_bio_prison_cell *cell =
  120. rb_entry(*new, struct dm_bio_prison_cell, node);
  121. r = cmp_keys(key, &cell->key);
  122. parent = *new;
  123. if (r < 0)
  124. new = &((*new)->rb_left);
  125. else if (r > 0)
  126. new = &((*new)->rb_right);
  127. else {
  128. if (inmate)
  129. bio_list_add(&cell->bios, inmate);
  130. *cell_result = cell;
  131. return 1;
  132. }
  133. }
  134. __setup_new_cell(key, inmate, cell_prealloc);
  135. *cell_result = cell_prealloc;
  136. rb_link_node(&cell_prealloc->node, parent, new);
  137. rb_insert_color(&cell_prealloc->node, root);
  138. return 0;
  139. }
  140. static int bio_detain(struct dm_bio_prison *prison,
  141. struct dm_cell_key *key,
  142. struct bio *inmate,
  143. struct dm_bio_prison_cell *cell_prealloc,
  144. struct dm_bio_prison_cell **cell_result)
  145. {
  146. int r;
  147. unsigned l = lock_nr(key, prison->num_locks);
  148. spin_lock_irq(&prison->regions[l].lock);
  149. r = __bio_detain(&prison->regions[l].cell, key, inmate, cell_prealloc, cell_result);
  150. spin_unlock_irq(&prison->regions[l].lock);
  151. return r;
  152. }
  153. int dm_bio_detain(struct dm_bio_prison *prison,
  154. struct dm_cell_key *key,
  155. struct bio *inmate,
  156. struct dm_bio_prison_cell *cell_prealloc,
  157. struct dm_bio_prison_cell **cell_result)
  158. {
  159. return bio_detain(prison, key, inmate, cell_prealloc, cell_result);
  160. }
  161. EXPORT_SYMBOL_GPL(dm_bio_detain);
  162. /*
  163. * @inmates must have been initialised prior to this call
  164. */
  165. static void __cell_release(struct rb_root *root,
  166. struct dm_bio_prison_cell *cell,
  167. struct bio_list *inmates)
  168. {
  169. rb_erase(&cell->node, root);
  170. if (inmates) {
  171. if (cell->holder)
  172. bio_list_add(inmates, cell->holder);
  173. bio_list_merge(inmates, &cell->bios);
  174. }
  175. }
  176. void dm_cell_release(struct dm_bio_prison *prison,
  177. struct dm_bio_prison_cell *cell,
  178. struct bio_list *bios)
  179. {
  180. unsigned l = lock_nr(&cell->key, prison->num_locks);
  181. spin_lock_irq(&prison->regions[l].lock);
  182. __cell_release(&prison->regions[l].cell, cell, bios);
  183. spin_unlock_irq(&prison->regions[l].lock);
  184. }
  185. EXPORT_SYMBOL_GPL(dm_cell_release);
  186. /*
  187. * Sometimes we don't want the holder, just the additional bios.
  188. */
  189. static void __cell_release_no_holder(struct rb_root *root,
  190. struct dm_bio_prison_cell *cell,
  191. struct bio_list *inmates)
  192. {
  193. rb_erase(&cell->node, root);
  194. bio_list_merge(inmates, &cell->bios);
  195. }
  196. void dm_cell_release_no_holder(struct dm_bio_prison *prison,
  197. struct dm_bio_prison_cell *cell,
  198. struct bio_list *inmates)
  199. {
  200. unsigned l = lock_nr(&cell->key, prison->num_locks);
  201. unsigned long flags;
  202. spin_lock_irqsave(&prison->regions[l].lock, flags);
  203. __cell_release_no_holder(&prison->regions[l].cell, cell, inmates);
  204. spin_unlock_irqrestore(&prison->regions[l].lock, flags);
  205. }
  206. EXPORT_SYMBOL_GPL(dm_cell_release_no_holder);
  207. void dm_cell_error(struct dm_bio_prison *prison,
  208. struct dm_bio_prison_cell *cell, blk_status_t error)
  209. {
  210. struct bio_list bios;
  211. struct bio *bio;
  212. bio_list_init(&bios);
  213. dm_cell_release(prison, cell, &bios);
  214. while ((bio = bio_list_pop(&bios))) {
  215. bio->bi_status = error;
  216. bio_endio(bio);
  217. }
  218. }
  219. EXPORT_SYMBOL_GPL(dm_cell_error);
  220. void dm_cell_visit_release(struct dm_bio_prison *prison,
  221. void (*visit_fn)(void *, struct dm_bio_prison_cell *),
  222. void *context,
  223. struct dm_bio_prison_cell *cell)
  224. {
  225. unsigned l = lock_nr(&cell->key, prison->num_locks);
  226. spin_lock_irq(&prison->regions[l].lock);
  227. visit_fn(context, cell);
  228. rb_erase(&cell->node, &prison->regions[l].cell);
  229. spin_unlock_irq(&prison->regions[l].lock);
  230. }
  231. EXPORT_SYMBOL_GPL(dm_cell_visit_release);
  232. /*----------------------------------------------------------------*/
  233. #define DEFERRED_SET_SIZE 64
  234. struct dm_deferred_entry {
  235. struct dm_deferred_set *ds;
  236. unsigned int count;
  237. struct list_head work_items;
  238. };
  239. struct dm_deferred_set {
  240. spinlock_t lock;
  241. unsigned int current_entry;
  242. unsigned int sweeper;
  243. struct dm_deferred_entry entries[DEFERRED_SET_SIZE];
  244. };
  245. struct dm_deferred_set *dm_deferred_set_create(void)
  246. {
  247. int i;
  248. struct dm_deferred_set *ds;
  249. ds = kmalloc_obj(*ds);
  250. if (!ds)
  251. return NULL;
  252. spin_lock_init(&ds->lock);
  253. ds->current_entry = 0;
  254. ds->sweeper = 0;
  255. for (i = 0; i < DEFERRED_SET_SIZE; i++) {
  256. ds->entries[i].ds = ds;
  257. ds->entries[i].count = 0;
  258. INIT_LIST_HEAD(&ds->entries[i].work_items);
  259. }
  260. return ds;
  261. }
  262. EXPORT_SYMBOL_GPL(dm_deferred_set_create);
  263. void dm_deferred_set_destroy(struct dm_deferred_set *ds)
  264. {
  265. kfree(ds);
  266. }
  267. EXPORT_SYMBOL_GPL(dm_deferred_set_destroy);
  268. struct dm_deferred_entry *dm_deferred_entry_inc(struct dm_deferred_set *ds)
  269. {
  270. unsigned long flags;
  271. struct dm_deferred_entry *entry;
  272. spin_lock_irqsave(&ds->lock, flags);
  273. entry = ds->entries + ds->current_entry;
  274. entry->count++;
  275. spin_unlock_irqrestore(&ds->lock, flags);
  276. return entry;
  277. }
  278. EXPORT_SYMBOL_GPL(dm_deferred_entry_inc);
  279. static unsigned int ds_next(unsigned int index)
  280. {
  281. return (index + 1) % DEFERRED_SET_SIZE;
  282. }
  283. static void __sweep(struct dm_deferred_set *ds, struct list_head *head)
  284. {
  285. while ((ds->sweeper != ds->current_entry) &&
  286. !ds->entries[ds->sweeper].count) {
  287. list_splice_init(&ds->entries[ds->sweeper].work_items, head);
  288. ds->sweeper = ds_next(ds->sweeper);
  289. }
  290. if ((ds->sweeper == ds->current_entry) && !ds->entries[ds->sweeper].count)
  291. list_splice_init(&ds->entries[ds->sweeper].work_items, head);
  292. }
  293. void dm_deferred_entry_dec(struct dm_deferred_entry *entry, struct list_head *head)
  294. {
  295. unsigned long flags;
  296. spin_lock_irqsave(&entry->ds->lock, flags);
  297. BUG_ON(!entry->count);
  298. --entry->count;
  299. __sweep(entry->ds, head);
  300. spin_unlock_irqrestore(&entry->ds->lock, flags);
  301. }
  302. EXPORT_SYMBOL_GPL(dm_deferred_entry_dec);
  303. /*
  304. * Returns 1 if deferred or 0 if no pending items to delay job.
  305. */
  306. int dm_deferred_set_add_work(struct dm_deferred_set *ds, struct list_head *work)
  307. {
  308. int r = 1;
  309. unsigned int next_entry;
  310. spin_lock_irq(&ds->lock);
  311. if ((ds->sweeper == ds->current_entry) &&
  312. !ds->entries[ds->current_entry].count)
  313. r = 0;
  314. else {
  315. list_add(work, &ds->entries[ds->current_entry].work_items);
  316. next_entry = ds_next(ds->current_entry);
  317. if (!ds->entries[next_entry].count)
  318. ds->current_entry = next_entry;
  319. }
  320. spin_unlock_irq(&ds->lock);
  321. return r;
  322. }
  323. EXPORT_SYMBOL_GPL(dm_deferred_set_add_work);
  324. /*----------------------------------------------------------------*/
  325. static int __init dm_bio_prison_init_v1(void)
  326. {
  327. _cell_cache = KMEM_CACHE(dm_bio_prison_cell, 0);
  328. if (!_cell_cache)
  329. return -ENOMEM;
  330. return 0;
  331. }
  332. static void dm_bio_prison_exit_v1(void)
  333. {
  334. kmem_cache_destroy(_cell_cache);
  335. _cell_cache = NULL;
  336. }
  337. static int (*_inits[])(void) __initdata = {
  338. dm_bio_prison_init_v1,
  339. dm_bio_prison_init_v2,
  340. };
  341. static void (*_exits[])(void) = {
  342. dm_bio_prison_exit_v1,
  343. dm_bio_prison_exit_v2,
  344. };
  345. static int __init dm_bio_prison_init(void)
  346. {
  347. const int count = ARRAY_SIZE(_inits);
  348. int r, i;
  349. for (i = 0; i < count; i++) {
  350. r = _inits[i]();
  351. if (r)
  352. goto bad;
  353. }
  354. return 0;
  355. bad:
  356. while (i--)
  357. _exits[i]();
  358. return r;
  359. }
  360. static void __exit dm_bio_prison_exit(void)
  361. {
  362. int i = ARRAY_SIZE(_exits);
  363. while (i--)
  364. _exits[i]();
  365. }
  366. /*
  367. * module hooks
  368. */
  369. module_init(dm_bio_prison_init);
  370. module_exit(dm_bio_prison_exit);
  371. MODULE_DESCRIPTION(DM_NAME " bio prison");
  372. MODULE_AUTHOR("Joe Thornber <dm-devel@lists.linux.dev>");
  373. MODULE_LICENSE("GPL");