dm-bio-prison-v1.c 10 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458
  1. /*
  2. * Copyright (C) 2012 Red Hat, Inc.
  3. *
  4. * This file is released under the GPL.
  5. */
  6. #include "dm.h"
  7. #include "dm-bio-prison-v1.h"
  8. #include "dm-bio-prison-v2.h"
  9. #include <linux/spinlock.h>
  10. #include <linux/mempool.h>
  11. #include <linux/module.h>
  12. #include <linux/slab.h>
  13. /*----------------------------------------------------------------*/
  14. #define MIN_CELLS 1024
  15. struct dm_bio_prison {
  16. spinlock_t lock;
  17. struct rb_root cells;
  18. mempool_t cell_pool;
  19. };
  20. static struct kmem_cache *_cell_cache;
  21. /*----------------------------------------------------------------*/
  22. /*
  23. * @nr_cells should be the number of cells you want in use _concurrently_.
  24. * Don't confuse it with the number of distinct keys.
  25. */
  26. struct dm_bio_prison *dm_bio_prison_create(void)
  27. {
  28. struct dm_bio_prison *prison = kzalloc(sizeof(*prison), GFP_KERNEL);
  29. int ret;
  30. if (!prison)
  31. return NULL;
  32. spin_lock_init(&prison->lock);
  33. ret = mempool_init_slab_pool(&prison->cell_pool, MIN_CELLS, _cell_cache);
  34. if (ret) {
  35. kfree(prison);
  36. return NULL;
  37. }
  38. prison->cells = RB_ROOT;
  39. return prison;
  40. }
  41. EXPORT_SYMBOL_GPL(dm_bio_prison_create);
  42. void dm_bio_prison_destroy(struct dm_bio_prison *prison)
  43. {
  44. mempool_exit(&prison->cell_pool);
  45. kfree(prison);
  46. }
  47. EXPORT_SYMBOL_GPL(dm_bio_prison_destroy);
  48. struct dm_bio_prison_cell *dm_bio_prison_alloc_cell(struct dm_bio_prison *prison, gfp_t gfp)
  49. {
  50. return mempool_alloc(&prison->cell_pool, gfp);
  51. }
  52. EXPORT_SYMBOL_GPL(dm_bio_prison_alloc_cell);
  53. void dm_bio_prison_free_cell(struct dm_bio_prison *prison,
  54. struct dm_bio_prison_cell *cell)
  55. {
  56. mempool_free(cell, &prison->cell_pool);
  57. }
  58. EXPORT_SYMBOL_GPL(dm_bio_prison_free_cell);
  59. static void __setup_new_cell(struct dm_cell_key *key,
  60. struct bio *holder,
  61. struct dm_bio_prison_cell *cell)
  62. {
  63. memcpy(&cell->key, key, sizeof(cell->key));
  64. cell->holder = holder;
  65. bio_list_init(&cell->bios);
  66. }
  67. static int cmp_keys(struct dm_cell_key *lhs,
  68. struct dm_cell_key *rhs)
  69. {
  70. if (lhs->virtual < rhs->virtual)
  71. return -1;
  72. if (lhs->virtual > rhs->virtual)
  73. return 1;
  74. if (lhs->dev < rhs->dev)
  75. return -1;
  76. if (lhs->dev > rhs->dev)
  77. return 1;
  78. if (lhs->block_end <= rhs->block_begin)
  79. return -1;
  80. if (lhs->block_begin >= rhs->block_end)
  81. return 1;
  82. return 0;
  83. }
  84. static int __bio_detain(struct dm_bio_prison *prison,
  85. struct dm_cell_key *key,
  86. struct bio *inmate,
  87. struct dm_bio_prison_cell *cell_prealloc,
  88. struct dm_bio_prison_cell **cell_result)
  89. {
  90. int r;
  91. struct rb_node **new = &prison->cells.rb_node, *parent = NULL;
  92. while (*new) {
  93. struct dm_bio_prison_cell *cell =
  94. rb_entry(*new, struct dm_bio_prison_cell, node);
  95. r = cmp_keys(key, &cell->key);
  96. parent = *new;
  97. if (r < 0)
  98. new = &((*new)->rb_left);
  99. else if (r > 0)
  100. new = &((*new)->rb_right);
  101. else {
  102. if (inmate)
  103. bio_list_add(&cell->bios, inmate);
  104. *cell_result = cell;
  105. return 1;
  106. }
  107. }
  108. __setup_new_cell(key, inmate, cell_prealloc);
  109. *cell_result = cell_prealloc;
  110. rb_link_node(&cell_prealloc->node, parent, new);
  111. rb_insert_color(&cell_prealloc->node, &prison->cells);
  112. return 0;
  113. }
  114. static int bio_detain(struct dm_bio_prison *prison,
  115. struct dm_cell_key *key,
  116. struct bio *inmate,
  117. struct dm_bio_prison_cell *cell_prealloc,
  118. struct dm_bio_prison_cell **cell_result)
  119. {
  120. int r;
  121. spin_lock_irq(&prison->lock);
  122. r = __bio_detain(prison, key, inmate, cell_prealloc, cell_result);
  123. spin_unlock_irq(&prison->lock);
  124. return r;
  125. }
  126. int dm_bio_detain(struct dm_bio_prison *prison,
  127. struct dm_cell_key *key,
  128. struct bio *inmate,
  129. struct dm_bio_prison_cell *cell_prealloc,
  130. struct dm_bio_prison_cell **cell_result)
  131. {
  132. return bio_detain(prison, key, inmate, cell_prealloc, cell_result);
  133. }
  134. EXPORT_SYMBOL_GPL(dm_bio_detain);
  135. int dm_get_cell(struct dm_bio_prison *prison,
  136. struct dm_cell_key *key,
  137. struct dm_bio_prison_cell *cell_prealloc,
  138. struct dm_bio_prison_cell **cell_result)
  139. {
  140. return bio_detain(prison, key, NULL, cell_prealloc, cell_result);
  141. }
  142. EXPORT_SYMBOL_GPL(dm_get_cell);
  143. /*
  144. * @inmates must have been initialised prior to this call
  145. */
  146. static void __cell_release(struct dm_bio_prison *prison,
  147. struct dm_bio_prison_cell *cell,
  148. struct bio_list *inmates)
  149. {
  150. rb_erase(&cell->node, &prison->cells);
  151. if (inmates) {
  152. if (cell->holder)
  153. bio_list_add(inmates, cell->holder);
  154. bio_list_merge(inmates, &cell->bios);
  155. }
  156. }
  157. void dm_cell_release(struct dm_bio_prison *prison,
  158. struct dm_bio_prison_cell *cell,
  159. struct bio_list *bios)
  160. {
  161. spin_lock_irq(&prison->lock);
  162. __cell_release(prison, cell, bios);
  163. spin_unlock_irq(&prison->lock);
  164. }
  165. EXPORT_SYMBOL_GPL(dm_cell_release);
  166. /*
  167. * Sometimes we don't want the holder, just the additional bios.
  168. */
  169. static void __cell_release_no_holder(struct dm_bio_prison *prison,
  170. struct dm_bio_prison_cell *cell,
  171. struct bio_list *inmates)
  172. {
  173. rb_erase(&cell->node, &prison->cells);
  174. bio_list_merge(inmates, &cell->bios);
  175. }
  176. void dm_cell_release_no_holder(struct dm_bio_prison *prison,
  177. struct dm_bio_prison_cell *cell,
  178. struct bio_list *inmates)
  179. {
  180. unsigned long flags;
  181. spin_lock_irqsave(&prison->lock, flags);
  182. __cell_release_no_holder(prison, cell, inmates);
  183. spin_unlock_irqrestore(&prison->lock, flags);
  184. }
  185. EXPORT_SYMBOL_GPL(dm_cell_release_no_holder);
  186. void dm_cell_error(struct dm_bio_prison *prison,
  187. struct dm_bio_prison_cell *cell, blk_status_t error)
  188. {
  189. struct bio_list bios;
  190. struct bio *bio;
  191. bio_list_init(&bios);
  192. dm_cell_release(prison, cell, &bios);
  193. while ((bio = bio_list_pop(&bios))) {
  194. bio->bi_status = error;
  195. bio_endio(bio);
  196. }
  197. }
  198. EXPORT_SYMBOL_GPL(dm_cell_error);
  199. void dm_cell_visit_release(struct dm_bio_prison *prison,
  200. void (*visit_fn)(void *, struct dm_bio_prison_cell *),
  201. void *context,
  202. struct dm_bio_prison_cell *cell)
  203. {
  204. spin_lock_irq(&prison->lock);
  205. visit_fn(context, cell);
  206. rb_erase(&cell->node, &prison->cells);
  207. spin_unlock_irq(&prison->lock);
  208. }
  209. EXPORT_SYMBOL_GPL(dm_cell_visit_release);
  210. static int __promote_or_release(struct dm_bio_prison *prison,
  211. struct dm_bio_prison_cell *cell)
  212. {
  213. if (bio_list_empty(&cell->bios)) {
  214. rb_erase(&cell->node, &prison->cells);
  215. return 1;
  216. }
  217. cell->holder = bio_list_pop(&cell->bios);
  218. return 0;
  219. }
  220. int dm_cell_promote_or_release(struct dm_bio_prison *prison,
  221. struct dm_bio_prison_cell *cell)
  222. {
  223. int r;
  224. spin_lock_irq(&prison->lock);
  225. r = __promote_or_release(prison, cell);
  226. spin_unlock_irq(&prison->lock);
  227. return r;
  228. }
  229. EXPORT_SYMBOL_GPL(dm_cell_promote_or_release);
  230. /*----------------------------------------------------------------*/
  231. #define DEFERRED_SET_SIZE 64
  232. struct dm_deferred_entry {
  233. struct dm_deferred_set *ds;
  234. unsigned int count;
  235. struct list_head work_items;
  236. };
  237. struct dm_deferred_set {
  238. spinlock_t lock;
  239. unsigned int current_entry;
  240. unsigned int sweeper;
  241. struct dm_deferred_entry entries[DEFERRED_SET_SIZE];
  242. };
  243. struct dm_deferred_set *dm_deferred_set_create(void)
  244. {
  245. int i;
  246. struct dm_deferred_set *ds;
  247. ds = kmalloc(sizeof(*ds), GFP_KERNEL);
  248. if (!ds)
  249. return NULL;
  250. spin_lock_init(&ds->lock);
  251. ds->current_entry = 0;
  252. ds->sweeper = 0;
  253. for (i = 0; i < DEFERRED_SET_SIZE; i++) {
  254. ds->entries[i].ds = ds;
  255. ds->entries[i].count = 0;
  256. INIT_LIST_HEAD(&ds->entries[i].work_items);
  257. }
  258. return ds;
  259. }
  260. EXPORT_SYMBOL_GPL(dm_deferred_set_create);
  261. void dm_deferred_set_destroy(struct dm_deferred_set *ds)
  262. {
  263. kfree(ds);
  264. }
  265. EXPORT_SYMBOL_GPL(dm_deferred_set_destroy);
  266. struct dm_deferred_entry *dm_deferred_entry_inc(struct dm_deferred_set *ds)
  267. {
  268. unsigned long flags;
  269. struct dm_deferred_entry *entry;
  270. spin_lock_irqsave(&ds->lock, flags);
  271. entry = ds->entries + ds->current_entry;
  272. entry->count++;
  273. spin_unlock_irqrestore(&ds->lock, flags);
  274. return entry;
  275. }
  276. EXPORT_SYMBOL_GPL(dm_deferred_entry_inc);
  277. static unsigned int ds_next(unsigned int index)
  278. {
  279. return (index + 1) % DEFERRED_SET_SIZE;
  280. }
  281. static void __sweep(struct dm_deferred_set *ds, struct list_head *head)
  282. {
  283. while ((ds->sweeper != ds->current_entry) &&
  284. !ds->entries[ds->sweeper].count) {
  285. list_splice_init(&ds->entries[ds->sweeper].work_items, head);
  286. ds->sweeper = ds_next(ds->sweeper);
  287. }
  288. if ((ds->sweeper == ds->current_entry) && !ds->entries[ds->sweeper].count)
  289. list_splice_init(&ds->entries[ds->sweeper].work_items, head);
  290. }
  291. void dm_deferred_entry_dec(struct dm_deferred_entry *entry, struct list_head *head)
  292. {
  293. unsigned long flags;
  294. spin_lock_irqsave(&entry->ds->lock, flags);
  295. BUG_ON(!entry->count);
  296. --entry->count;
  297. __sweep(entry->ds, head);
  298. spin_unlock_irqrestore(&entry->ds->lock, flags);
  299. }
  300. EXPORT_SYMBOL_GPL(dm_deferred_entry_dec);
  301. /*
  302. * Returns 1 if deferred or 0 if no pending items to delay job.
  303. */
  304. int dm_deferred_set_add_work(struct dm_deferred_set *ds, struct list_head *work)
  305. {
  306. int r = 1;
  307. unsigned int next_entry;
  308. spin_lock_irq(&ds->lock);
  309. if ((ds->sweeper == ds->current_entry) &&
  310. !ds->entries[ds->current_entry].count)
  311. r = 0;
  312. else {
  313. list_add(work, &ds->entries[ds->current_entry].work_items);
  314. next_entry = ds_next(ds->current_entry);
  315. if (!ds->entries[next_entry].count)
  316. ds->current_entry = next_entry;
  317. }
  318. spin_unlock_irq(&ds->lock);
  319. return r;
  320. }
  321. EXPORT_SYMBOL_GPL(dm_deferred_set_add_work);
  322. /*----------------------------------------------------------------*/
  323. static int __init dm_bio_prison_init_v1(void)
  324. {
  325. _cell_cache = KMEM_CACHE(dm_bio_prison_cell, 0);
  326. if (!_cell_cache)
  327. return -ENOMEM;
  328. return 0;
  329. }
  330. static void dm_bio_prison_exit_v1(void)
  331. {
  332. kmem_cache_destroy(_cell_cache);
  333. _cell_cache = NULL;
  334. }
  335. static int (*_inits[])(void) __initdata = {
  336. dm_bio_prison_init_v1,
  337. dm_bio_prison_init_v2,
  338. };
  339. static void (*_exits[])(void) = {
  340. dm_bio_prison_exit_v1,
  341. dm_bio_prison_exit_v2,
  342. };
  343. static int __init dm_bio_prison_init(void)
  344. {
  345. const int count = ARRAY_SIZE(_inits);
  346. int r, i;
  347. for (i = 0; i < count; i++) {
  348. r = _inits[i]();
  349. if (r)
  350. goto bad;
  351. }
  352. return 0;
  353. bad:
  354. while (i--)
  355. _exits[i]();
  356. return r;
  357. }
  358. static void __exit dm_bio_prison_exit(void)
  359. {
  360. int i = ARRAY_SIZE(_exits);
  361. while (i--)
  362. _exits[i]();
  363. }
  364. /*
  365. * module hooks
  366. */
  367. module_init(dm_bio_prison_init);
  368. module_exit(dm_bio_prison_exit);
  369. MODULE_DESCRIPTION(DM_NAME " bio prison");
  370. MODULE_AUTHOR("Joe Thornber <[email protected]>");
  371. MODULE_LICENSE("GPL");