elevator.c 19 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634635636637638639640641642643644645646647648649650651652653654655656657658659660661662663664665666667668669670671672673674675676677678679680681682683684685686687688689690691692693694695696697698699700701702703704705706707708709710711712713714715716717718719720721722723724725726727728729730731732733734735736737738739740741742743744745746747748749750751752753754755756757758759760761762763764765766767768769770771772773774775776777778779780781782783784785786787788789790791792793794795796797798799800801802803804805806807808809810811812813814815816817818819820821822823824825826827828829830831832833834835836837838839840841842843844845846847848849850851852853854855856857858859
  1. // SPDX-License-Identifier: GPL-2.0
  2. /*
  3. * Block device elevator/IO-scheduler.
  4. *
  5. * Copyright (C) 2000 Andrea Arcangeli <[email protected]> SuSE
  6. *
  7. * 30042000 Jens Axboe <[email protected]> :
  8. *
  9. * Split the elevator a bit so that it is possible to choose a different
  10. * one or even write a new "plug in". There are three pieces:
  11. * - elevator_fn, inserts a new request in the queue list
  12. * - elevator_merge_fn, decides whether a new buffer can be merged with
  13. * an existing request
  14. * - elevator_dequeue_fn, called when a request is taken off the active list
  15. *
  16. * 20082000 Dave Jones <[email protected]> :
  17. * Removed tests for max-bomb-segments, which was breaking elvtune
  18. * when run without -bN
  19. *
  20. * Jens:
  21. * - Rework again to work with bio instead of buffer_heads
  22. * - loose bi_dev comparisons, partition handling is right now
  23. * - completely modularize elevator setup and teardown
  24. *
  25. */
  26. #include <linux/kernel.h>
  27. #include <linux/fs.h>
  28. #include <linux/blkdev.h>
  29. #include <linux/bio.h>
  30. #include <linux/module.h>
  31. #include <linux/slab.h>
  32. #include <linux/init.h>
  33. #include <linux/compiler.h>
  34. #include <linux/blktrace_api.h>
  35. #include <linux/hash.h>
  36. #include <linux/uaccess.h>
  37. #include <linux/pm_runtime.h>
  38. #include <trace/events/block.h>
  39. #include "elevator.h"
  40. #include "blk.h"
  41. #include "blk-mq-sched.h"
  42. #include "blk-pm.h"
  43. #include "blk-wbt.h"
  44. #include "blk-cgroup.h"
  45. static DEFINE_SPINLOCK(elv_list_lock);
  46. static LIST_HEAD(elv_list);
  47. /*
  48. * Merge hash stuff.
  49. */
  50. #define rq_hash_key(rq) (blk_rq_pos(rq) + blk_rq_sectors(rq))
  51. /*
  52. * Query io scheduler to see if the current process issuing bio may be
  53. * merged with rq.
  54. */
  55. static int elv_iosched_allow_bio_merge(struct request *rq, struct bio *bio)
  56. {
  57. struct request_queue *q = rq->q;
  58. struct elevator_queue *e = q->elevator;
  59. if (e->type->ops.allow_merge)
  60. return e->type->ops.allow_merge(q, rq, bio);
  61. return 1;
  62. }
  63. /*
  64. * can we safely merge with this request?
  65. */
  66. bool elv_bio_merge_ok(struct request *rq, struct bio *bio)
  67. {
  68. if (!blk_rq_merge_ok(rq, bio))
  69. return false;
  70. if (!elv_iosched_allow_bio_merge(rq, bio))
  71. return false;
  72. return true;
  73. }
  74. EXPORT_SYMBOL(elv_bio_merge_ok);
  75. static inline bool elv_support_features(unsigned int elv_features,
  76. unsigned int required_features)
  77. {
  78. return (required_features & elv_features) == required_features;
  79. }
  80. /**
  81. * elevator_match - Test an elevator name and features
  82. * @e: Scheduler to test
  83. * @name: Elevator name to test
  84. * @required_features: Features that the elevator must provide
  85. *
  86. * Return true if the elevator @e name matches @name and if @e provides all
  87. * the features specified by @required_features.
  88. */
  89. static bool elevator_match(const struct elevator_type *e, const char *name,
  90. unsigned int required_features)
  91. {
  92. if (!elv_support_features(e->elevator_features, required_features))
  93. return false;
  94. if (!strcmp(e->elevator_name, name))
  95. return true;
  96. if (e->elevator_alias && !strcmp(e->elevator_alias, name))
  97. return true;
  98. return false;
  99. }
  100. /**
  101. * elevator_find - Find an elevator
  102. * @name: Name of the elevator to find
  103. * @required_features: Features that the elevator must provide
  104. *
  105. * Return the first registered scheduler with name @name and supporting the
  106. * features @required_features and NULL otherwise.
  107. */
  108. static struct elevator_type *elevator_find(const char *name,
  109. unsigned int required_features)
  110. {
  111. struct elevator_type *e;
  112. list_for_each_entry(e, &elv_list, list) {
  113. if (elevator_match(e, name, required_features))
  114. return e;
  115. }
  116. return NULL;
  117. }
  118. static void elevator_put(struct elevator_type *e)
  119. {
  120. module_put(e->elevator_owner);
  121. }
  122. static struct elevator_type *elevator_get(struct request_queue *q,
  123. const char *name, bool try_loading)
  124. {
  125. struct elevator_type *e;
  126. spin_lock(&elv_list_lock);
  127. e = elevator_find(name, q->required_elevator_features);
  128. if (!e && try_loading) {
  129. spin_unlock(&elv_list_lock);
  130. request_module("%s-iosched", name);
  131. spin_lock(&elv_list_lock);
  132. e = elevator_find(name, q->required_elevator_features);
  133. }
  134. if (e && !try_module_get(e->elevator_owner))
  135. e = NULL;
  136. spin_unlock(&elv_list_lock);
  137. return e;
  138. }
  139. static struct kobj_type elv_ktype;
  140. struct elevator_queue *elevator_alloc(struct request_queue *q,
  141. struct elevator_type *e)
  142. {
  143. struct elevator_queue *eq;
  144. eq = kzalloc_node(sizeof(*eq), GFP_KERNEL, q->node);
  145. if (unlikely(!eq))
  146. return NULL;
  147. eq->type = e;
  148. kobject_init(&eq->kobj, &elv_ktype);
  149. mutex_init(&eq->sysfs_lock);
  150. hash_init(eq->hash);
  151. return eq;
  152. }
  153. EXPORT_SYMBOL(elevator_alloc);
  154. static void elevator_release(struct kobject *kobj)
  155. {
  156. struct elevator_queue *e;
  157. e = container_of(kobj, struct elevator_queue, kobj);
  158. elevator_put(e->type);
  159. kfree(e);
  160. }
  161. void elevator_exit(struct request_queue *q)
  162. {
  163. struct elevator_queue *e = q->elevator;
  164. ioc_clear_queue(q);
  165. blk_mq_sched_free_rqs(q);
  166. mutex_lock(&e->sysfs_lock);
  167. blk_mq_exit_sched(q, e);
  168. mutex_unlock(&e->sysfs_lock);
  169. kobject_put(&e->kobj);
  170. }
  171. static inline void __elv_rqhash_del(struct request *rq)
  172. {
  173. hash_del(&rq->hash);
  174. rq->rq_flags &= ~RQF_HASHED;
  175. }
  176. void elv_rqhash_del(struct request_queue *q, struct request *rq)
  177. {
  178. if (ELV_ON_HASH(rq))
  179. __elv_rqhash_del(rq);
  180. }
  181. EXPORT_SYMBOL_GPL(elv_rqhash_del);
  182. void elv_rqhash_add(struct request_queue *q, struct request *rq)
  183. {
  184. struct elevator_queue *e = q->elevator;
  185. BUG_ON(ELV_ON_HASH(rq));
  186. hash_add(e->hash, &rq->hash, rq_hash_key(rq));
  187. rq->rq_flags |= RQF_HASHED;
  188. }
  189. EXPORT_SYMBOL_GPL(elv_rqhash_add);
  190. void elv_rqhash_reposition(struct request_queue *q, struct request *rq)
  191. {
  192. __elv_rqhash_del(rq);
  193. elv_rqhash_add(q, rq);
  194. }
  195. struct request *elv_rqhash_find(struct request_queue *q, sector_t offset)
  196. {
  197. struct elevator_queue *e = q->elevator;
  198. struct hlist_node *next;
  199. struct request *rq;
  200. hash_for_each_possible_safe(e->hash, rq, next, hash, offset) {
  201. BUG_ON(!ELV_ON_HASH(rq));
  202. if (unlikely(!rq_mergeable(rq))) {
  203. __elv_rqhash_del(rq);
  204. continue;
  205. }
  206. if (rq_hash_key(rq) == offset)
  207. return rq;
  208. }
  209. return NULL;
  210. }
  211. /*
  212. * RB-tree support functions for inserting/lookup/removal of requests
  213. * in a sorted RB tree.
  214. */
  215. void elv_rb_add(struct rb_root *root, struct request *rq)
  216. {
  217. struct rb_node **p = &root->rb_node;
  218. struct rb_node *parent = NULL;
  219. struct request *__rq;
  220. while (*p) {
  221. parent = *p;
  222. __rq = rb_entry(parent, struct request, rb_node);
  223. if (blk_rq_pos(rq) < blk_rq_pos(__rq))
  224. p = &(*p)->rb_left;
  225. else if (blk_rq_pos(rq) >= blk_rq_pos(__rq))
  226. p = &(*p)->rb_right;
  227. }
  228. rb_link_node(&rq->rb_node, parent, p);
  229. rb_insert_color(&rq->rb_node, root);
  230. }
  231. EXPORT_SYMBOL(elv_rb_add);
  232. void elv_rb_del(struct rb_root *root, struct request *rq)
  233. {
  234. BUG_ON(RB_EMPTY_NODE(&rq->rb_node));
  235. rb_erase(&rq->rb_node, root);
  236. RB_CLEAR_NODE(&rq->rb_node);
  237. }
  238. EXPORT_SYMBOL(elv_rb_del);
  239. struct request *elv_rb_find(struct rb_root *root, sector_t sector)
  240. {
  241. struct rb_node *n = root->rb_node;
  242. struct request *rq;
  243. while (n) {
  244. rq = rb_entry(n, struct request, rb_node);
  245. if (sector < blk_rq_pos(rq))
  246. n = n->rb_left;
  247. else if (sector > blk_rq_pos(rq))
  248. n = n->rb_right;
  249. else
  250. return rq;
  251. }
  252. return NULL;
  253. }
  254. EXPORT_SYMBOL(elv_rb_find);
  255. enum elv_merge elv_merge(struct request_queue *q, struct request **req,
  256. struct bio *bio)
  257. {
  258. struct elevator_queue *e = q->elevator;
  259. struct request *__rq;
  260. /*
  261. * Levels of merges:
  262. * nomerges: No merges at all attempted
  263. * noxmerges: Only simple one-hit cache try
  264. * merges: All merge tries attempted
  265. */
  266. if (blk_queue_nomerges(q) || !bio_mergeable(bio))
  267. return ELEVATOR_NO_MERGE;
  268. /*
  269. * First try one-hit cache.
  270. */
  271. if (q->last_merge && elv_bio_merge_ok(q->last_merge, bio)) {
  272. enum elv_merge ret = blk_try_merge(q->last_merge, bio);
  273. if (ret != ELEVATOR_NO_MERGE) {
  274. *req = q->last_merge;
  275. return ret;
  276. }
  277. }
  278. if (blk_queue_noxmerges(q))
  279. return ELEVATOR_NO_MERGE;
  280. /*
  281. * See if our hash lookup can find a potential backmerge.
  282. */
  283. __rq = elv_rqhash_find(q, bio->bi_iter.bi_sector);
  284. if (__rq && elv_bio_merge_ok(__rq, bio)) {
  285. *req = __rq;
  286. if (blk_discard_mergable(__rq))
  287. return ELEVATOR_DISCARD_MERGE;
  288. return ELEVATOR_BACK_MERGE;
  289. }
  290. if (e->type->ops.request_merge)
  291. return e->type->ops.request_merge(q, req, bio);
  292. return ELEVATOR_NO_MERGE;
  293. }
  294. /*
  295. * Attempt to do an insertion back merge. Only check for the case where
  296. * we can append 'rq' to an existing request, so we can throw 'rq' away
  297. * afterwards.
  298. *
  299. * Returns true if we merged, false otherwise. 'free' will contain all
  300. * requests that need to be freed.
  301. */
  302. bool elv_attempt_insert_merge(struct request_queue *q, struct request *rq,
  303. struct list_head *free)
  304. {
  305. struct request *__rq;
  306. bool ret;
  307. if (blk_queue_nomerges(q))
  308. return false;
  309. /*
  310. * First try one-hit cache.
  311. */
  312. if (q->last_merge && blk_attempt_req_merge(q, q->last_merge, rq)) {
  313. list_add(&rq->queuelist, free);
  314. return true;
  315. }
  316. if (blk_queue_noxmerges(q))
  317. return false;
  318. ret = false;
  319. /*
  320. * See if our hash lookup can find a potential backmerge.
  321. */
  322. while (1) {
  323. __rq = elv_rqhash_find(q, blk_rq_pos(rq));
  324. if (!__rq || !blk_attempt_req_merge(q, __rq, rq))
  325. break;
  326. list_add(&rq->queuelist, free);
  327. /* The merged request could be merged with others, try again */
  328. ret = true;
  329. rq = __rq;
  330. }
  331. return ret;
  332. }
  333. void elv_merged_request(struct request_queue *q, struct request *rq,
  334. enum elv_merge type)
  335. {
  336. struct elevator_queue *e = q->elevator;
  337. if (e->type->ops.request_merged)
  338. e->type->ops.request_merged(q, rq, type);
  339. if (type == ELEVATOR_BACK_MERGE)
  340. elv_rqhash_reposition(q, rq);
  341. q->last_merge = rq;
  342. }
  343. void elv_merge_requests(struct request_queue *q, struct request *rq,
  344. struct request *next)
  345. {
  346. struct elevator_queue *e = q->elevator;
  347. if (e->type->ops.requests_merged)
  348. e->type->ops.requests_merged(q, rq, next);
  349. elv_rqhash_reposition(q, rq);
  350. q->last_merge = rq;
  351. }
  352. struct request *elv_latter_request(struct request_queue *q, struct request *rq)
  353. {
  354. struct elevator_queue *e = q->elevator;
  355. if (e->type->ops.next_request)
  356. return e->type->ops.next_request(q, rq);
  357. return NULL;
  358. }
  359. struct request *elv_former_request(struct request_queue *q, struct request *rq)
  360. {
  361. struct elevator_queue *e = q->elevator;
  362. if (e->type->ops.former_request)
  363. return e->type->ops.former_request(q, rq);
  364. return NULL;
  365. }
  366. #define to_elv(atr) container_of((atr), struct elv_fs_entry, attr)
  367. static ssize_t
  368. elv_attr_show(struct kobject *kobj, struct attribute *attr, char *page)
  369. {
  370. struct elv_fs_entry *entry = to_elv(attr);
  371. struct elevator_queue *e;
  372. ssize_t error;
  373. if (!entry->show)
  374. return -EIO;
  375. e = container_of(kobj, struct elevator_queue, kobj);
  376. mutex_lock(&e->sysfs_lock);
  377. error = e->type ? entry->show(e, page) : -ENOENT;
  378. mutex_unlock(&e->sysfs_lock);
  379. return error;
  380. }
  381. static ssize_t
  382. elv_attr_store(struct kobject *kobj, struct attribute *attr,
  383. const char *page, size_t length)
  384. {
  385. struct elv_fs_entry *entry = to_elv(attr);
  386. struct elevator_queue *e;
  387. ssize_t error;
  388. if (!entry->store)
  389. return -EIO;
  390. e = container_of(kobj, struct elevator_queue, kobj);
  391. mutex_lock(&e->sysfs_lock);
  392. error = e->type ? entry->store(e, page, length) : -ENOENT;
  393. mutex_unlock(&e->sysfs_lock);
  394. return error;
  395. }
  396. static const struct sysfs_ops elv_sysfs_ops = {
  397. .show = elv_attr_show,
  398. .store = elv_attr_store,
  399. };
  400. static struct kobj_type elv_ktype = {
  401. .sysfs_ops = &elv_sysfs_ops,
  402. .release = elevator_release,
  403. };
  404. int elv_register_queue(struct request_queue *q, bool uevent)
  405. {
  406. struct elevator_queue *e = q->elevator;
  407. int error;
  408. lockdep_assert_held(&q->sysfs_lock);
  409. error = kobject_add(&e->kobj, &q->kobj, "%s", "iosched");
  410. if (!error) {
  411. struct elv_fs_entry *attr = e->type->elevator_attrs;
  412. if (attr) {
  413. while (attr->attr.name) {
  414. if (sysfs_create_file(&e->kobj, &attr->attr))
  415. break;
  416. attr++;
  417. }
  418. }
  419. if (uevent)
  420. kobject_uevent(&e->kobj, KOBJ_ADD);
  421. e->registered = 1;
  422. }
  423. return error;
  424. }
  425. void elv_unregister_queue(struct request_queue *q)
  426. {
  427. struct elevator_queue *e = q->elevator;
  428. lockdep_assert_held(&q->sysfs_lock);
  429. if (e && e->registered) {
  430. struct elevator_queue *e = q->elevator;
  431. kobject_uevent(&e->kobj, KOBJ_REMOVE);
  432. kobject_del(&e->kobj);
  433. e->registered = 0;
  434. }
  435. }
  436. int elv_register(struct elevator_type *e)
  437. {
  438. /* insert_requests and dispatch_request are mandatory */
  439. if (WARN_ON_ONCE(!e->ops.insert_requests || !e->ops.dispatch_request))
  440. return -EINVAL;
  441. /* create icq_cache if requested */
  442. if (e->icq_size) {
  443. if (WARN_ON(e->icq_size < sizeof(struct io_cq)) ||
  444. WARN_ON(e->icq_align < __alignof__(struct io_cq)))
  445. return -EINVAL;
  446. snprintf(e->icq_cache_name, sizeof(e->icq_cache_name),
  447. "%s_io_cq", e->elevator_name);
  448. e->icq_cache = kmem_cache_create(e->icq_cache_name, e->icq_size,
  449. e->icq_align, 0, NULL);
  450. if (!e->icq_cache)
  451. return -ENOMEM;
  452. }
  453. /* register, don't allow duplicate names */
  454. spin_lock(&elv_list_lock);
  455. if (elevator_find(e->elevator_name, 0)) {
  456. spin_unlock(&elv_list_lock);
  457. kmem_cache_destroy(e->icq_cache);
  458. return -EBUSY;
  459. }
  460. list_add_tail(&e->list, &elv_list);
  461. spin_unlock(&elv_list_lock);
  462. printk(KERN_INFO "io scheduler %s registered\n", e->elevator_name);
  463. return 0;
  464. }
  465. EXPORT_SYMBOL_GPL(elv_register);
  466. void elv_unregister(struct elevator_type *e)
  467. {
  468. /* unregister */
  469. spin_lock(&elv_list_lock);
  470. list_del_init(&e->list);
  471. spin_unlock(&elv_list_lock);
  472. /*
  473. * Destroy icq_cache if it exists. icq's are RCU managed. Make
  474. * sure all RCU operations are complete before proceeding.
  475. */
  476. if (e->icq_cache) {
  477. rcu_barrier();
  478. kmem_cache_destroy(e->icq_cache);
  479. e->icq_cache = NULL;
  480. }
  481. }
  482. EXPORT_SYMBOL_GPL(elv_unregister);
  483. static int elevator_switch_mq(struct request_queue *q,
  484. struct elevator_type *new_e)
  485. {
  486. int ret;
  487. lockdep_assert_held(&q->sysfs_lock);
  488. if (q->elevator) {
  489. elv_unregister_queue(q);
  490. elevator_exit(q);
  491. }
  492. ret = blk_mq_init_sched(q, new_e);
  493. if (ret)
  494. goto out;
  495. if (new_e) {
  496. ret = elv_register_queue(q, true);
  497. if (ret) {
  498. elevator_exit(q);
  499. goto out;
  500. }
  501. }
  502. if (new_e)
  503. blk_add_trace_msg(q, "elv switch: %s", new_e->elevator_name);
  504. else
  505. blk_add_trace_msg(q, "elv switch: none");
  506. out:
  507. return ret;
  508. }
  509. static inline bool elv_support_iosched(struct request_queue *q)
  510. {
  511. if (!queue_is_mq(q) ||
  512. (q->tag_set && (q->tag_set->flags & BLK_MQ_F_NO_SCHED)))
  513. return false;
  514. return true;
  515. }
  516. /*
  517. * For single queue devices, default to using mq-deadline. If we have multiple
  518. * queues or mq-deadline is not available, default to "none".
  519. */
  520. static struct elevator_type *elevator_get_default(struct request_queue *q)
  521. {
  522. if (q->tag_set && q->tag_set->flags & BLK_MQ_F_NO_SCHED_BY_DEFAULT)
  523. return NULL;
  524. if (q->nr_hw_queues != 1 &&
  525. !blk_mq_is_shared_tags(q->tag_set->flags))
  526. return NULL;
  527. return elevator_get(q, "mq-deadline", false);
  528. }
  529. /*
  530. * Get the first elevator providing the features required by the request queue.
  531. * Default to "none" if no matching elevator is found.
  532. */
  533. static struct elevator_type *elevator_get_by_features(struct request_queue *q)
  534. {
  535. struct elevator_type *e, *found = NULL;
  536. spin_lock(&elv_list_lock);
  537. list_for_each_entry(e, &elv_list, list) {
  538. if (elv_support_features(e->elevator_features,
  539. q->required_elevator_features)) {
  540. found = e;
  541. break;
  542. }
  543. }
  544. if (found && !try_module_get(found->elevator_owner))
  545. found = NULL;
  546. spin_unlock(&elv_list_lock);
  547. return found;
  548. }
  549. /*
  550. * For a device queue that has no required features, use the default elevator
  551. * settings. Otherwise, use the first elevator available matching the required
  552. * features. If no suitable elevator is find or if the chosen elevator
  553. * initialization fails, fall back to the "none" elevator (no elevator).
  554. */
  555. void elevator_init_mq(struct request_queue *q)
  556. {
  557. struct elevator_type *e;
  558. int err;
  559. if (!elv_support_iosched(q))
  560. return;
  561. WARN_ON_ONCE(blk_queue_registered(q));
  562. if (unlikely(q->elevator))
  563. return;
  564. if (!q->required_elevator_features)
  565. e = elevator_get_default(q);
  566. else
  567. e = elevator_get_by_features(q);
  568. if (!e)
  569. return;
  570. /*
  571. * We are called before adding disk, when there isn't any FS I/O,
  572. * so freezing queue plus canceling dispatch work is enough to
  573. * drain any dispatch activities originated from passthrough
  574. * requests, then no need to quiesce queue which may add long boot
  575. * latency, especially when lots of disks are involved.
  576. */
  577. blk_mq_freeze_queue(q);
  578. blk_mq_cancel_work_sync(q);
  579. err = blk_mq_init_sched(q, e);
  580. blk_mq_unfreeze_queue(q);
  581. if (err) {
  582. pr_warn("\"%s\" elevator initialization failed, "
  583. "falling back to \"none\"\n", e->elevator_name);
  584. elevator_put(e);
  585. }
  586. }
  587. /*
  588. * switch to new_e io scheduler. be careful not to introduce deadlocks -
  589. * we don't free the old io scheduler, before we have allocated what we
  590. * need for the new one. this way we have a chance of going back to the old
  591. * one, if the new one fails init for some reason.
  592. */
  593. int elevator_switch(struct request_queue *q, struct elevator_type *new_e)
  594. {
  595. int err;
  596. lockdep_assert_held(&q->sysfs_lock);
  597. blk_mq_freeze_queue(q);
  598. blk_mq_quiesce_queue(q);
  599. err = elevator_switch_mq(q, new_e);
  600. blk_mq_unquiesce_queue(q);
  601. blk_mq_unfreeze_queue(q);
  602. return err;
  603. }
  604. /*
  605. * Switch this queue to the given IO scheduler.
  606. */
  607. static int __elevator_change(struct request_queue *q, const char *name)
  608. {
  609. char elevator_name[ELV_NAME_MAX];
  610. struct elevator_type *e;
  611. /* Make sure queue is not in the middle of being removed */
  612. if (!blk_queue_registered(q))
  613. return -ENOENT;
  614. /*
  615. * Special case for mq, turn off scheduling
  616. */
  617. if (!strncmp(name, "none", 4)) {
  618. if (!q->elevator)
  619. return 0;
  620. return elevator_switch(q, NULL);
  621. }
  622. strlcpy(elevator_name, name, sizeof(elevator_name));
  623. e = elevator_get(q, strstrip(elevator_name), true);
  624. if (!e)
  625. return -EINVAL;
  626. if (q->elevator &&
  627. elevator_match(q->elevator->type, elevator_name, 0)) {
  628. elevator_put(e);
  629. return 0;
  630. }
  631. return elevator_switch(q, e);
  632. }
  633. ssize_t elv_iosched_store(struct request_queue *q, const char *name,
  634. size_t count)
  635. {
  636. int ret;
  637. if (!elv_support_iosched(q))
  638. return count;
  639. ret = __elevator_change(q, name);
  640. if (!ret)
  641. return count;
  642. return ret;
  643. }
  644. ssize_t elv_iosched_show(struct request_queue *q, char *name)
  645. {
  646. struct elevator_queue *e = q->elevator;
  647. struct elevator_type *elv = NULL;
  648. struct elevator_type *__e;
  649. int len = 0;
  650. if (!queue_is_mq(q))
  651. return sprintf(name, "none\n");
  652. if (!q->elevator)
  653. len += sprintf(name+len, "[none] ");
  654. else
  655. elv = e->type;
  656. spin_lock(&elv_list_lock);
  657. list_for_each_entry(__e, &elv_list, list) {
  658. if (elv && elevator_match(elv, __e->elevator_name, 0)) {
  659. len += sprintf(name+len, "[%s] ", elv->elevator_name);
  660. continue;
  661. }
  662. if (elv_support_iosched(q) &&
  663. elevator_match(__e, __e->elevator_name,
  664. q->required_elevator_features))
  665. len += sprintf(name+len, "%s ", __e->elevator_name);
  666. }
  667. spin_unlock(&elv_list_lock);
  668. if (q->elevator)
  669. len += sprintf(name+len, "none");
  670. len += sprintf(len+name, "\n");
  671. return len;
  672. }
  673. struct request *elv_rb_former_request(struct request_queue *q,
  674. struct request *rq)
  675. {
  676. struct rb_node *rbprev = rb_prev(&rq->rb_node);
  677. if (rbprev)
  678. return rb_entry_rq(rbprev);
  679. return NULL;
  680. }
  681. EXPORT_SYMBOL(elv_rb_former_request);
  682. struct request *elv_rb_latter_request(struct request_queue *q,
  683. struct request *rq)
  684. {
  685. struct rb_node *rbnext = rb_next(&rq->rb_node);
  686. if (rbnext)
  687. return rb_entry_rq(rbnext);
  688. return NULL;
  689. }
  690. EXPORT_SYMBOL(elv_rb_latter_request);
  691. static int __init elevator_setup(char *str)
  692. {
  693. pr_warn("Kernel parameter elevator= does not have any effect anymore.\n"
  694. "Please use sysfs to set IO scheduler for individual devices.\n");
  695. return 1;
  696. }
  697. __setup("elevator=", elevator_setup);