sch_gred.c

// SPDX-License-Identifier: GPL-2.0-or-later
/*
 * net/sched/sch_gred.c	Generic Random Early Detection queue.
 *
 * Authors:    J Hadi Salim ([email protected]) 1998-2002
 *
 * 991129: -  Bug fix with grio mode
 *	      - a better sing. AvgQ mode with Grio(WRED)
 *	      - A finer grained VQ dequeue based on suggestion
 *	        from Ren Liu
 *	      - More error checks
 *
 * For all the glorious comments look at include/net/red.h
 */

#include <linux/slab.h>
#include <linux/module.h>
#include <linux/types.h>
#include <linux/kernel.h>
#include <linux/skbuff.h>
#include <net/pkt_cls.h>
#include <net/pkt_sched.h>
#include <net/red.h>

#define GRED_DEF_PRIO (MAX_DPs / 2)
#define GRED_VQ_MASK (MAX_DPs - 1)

#define GRED_VQ_RED_FLAGS	(TC_RED_ECN | TC_RED_HARDDROP)

struct gred_sched_data;
struct gred_sched;

struct gred_sched_data {
        u32		limit;		/* HARD maximal queue length	*/
        u32		DP;		/* the drop parameters */
        u32		red_flags;	/* virtualQ version of red_flags */
        u64		bytesin;	/* bytes seen on virtualQ so far*/
        u32		packetsin;	/* packets seen on virtualQ so far*/
        u32		backlog;	/* bytes on the virtualQ */
        u8		prio;		/* the prio of this vq */

        struct red_parms parms;
        struct red_vars  vars;
        struct red_stats stats;
};

enum {
        GRED_WRED_MODE = 1,
        GRED_RIO_MODE,
};

struct gred_sched {
        struct gred_sched_data *tab[MAX_DPs];
        unsigned long	flags;
        u32		red_flags;
        u32		DPs;
        u32		def;
        struct red_vars wred_set;
        struct tc_gred_qopt_offload *opt;
};

static inline int gred_wred_mode(struct gred_sched *table)
{
        return test_bit(GRED_WRED_MODE, &table->flags);
}

static inline void gred_enable_wred_mode(struct gred_sched *table)
{
        __set_bit(GRED_WRED_MODE, &table->flags);
}

static inline void gred_disable_wred_mode(struct gred_sched *table)
{
        __clear_bit(GRED_WRED_MODE, &table->flags);
}

static inline int gred_rio_mode(struct gred_sched *table)
{
        return test_bit(GRED_RIO_MODE, &table->flags);
}

static inline void gred_enable_rio_mode(struct gred_sched *table)
{
        __set_bit(GRED_RIO_MODE, &table->flags);
}

static inline void gred_disable_rio_mode(struct gred_sched *table)
{
        __clear_bit(GRED_RIO_MODE, &table->flags);
}
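
/* Callers enable WRED mode (one aggregate average queue shared by all VQs)
 * only when at least two virtual queues are configured with the same
 * priority; this helper reports whether such a duplicate priority exists.
 */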
static inline int gred_wred_mode_check(struct Qdisc *sch)
{
        struct gred_sched *table = qdisc_priv(sch);
        int i;

        /* Really ugly O(n^2) but shouldn't be necessary too frequent. */
        for (i = 0; i < table->DPs; i++) {
                struct gred_sched_data *q = table->tab[i];
                int n;

                if (q == NULL)
                        continue;

                for (n = i + 1; n < table->DPs; n++)
                        if (table->tab[n] && table->tab[n]->prio == q->prio)
                                return 1;
        }

        return 0;
}

static inline unsigned int gred_backlog(struct gred_sched *table,
                                        struct gred_sched_data *q,
                                        struct Qdisc *sch)
{
        if (gred_wred_mode(table))
                return sch->qstats.backlog;
        else
                return q->backlog;
}

static inline u16 tc_index_to_dp(struct sk_buff *skb)
{
        return skb->tc_index & GRED_VQ_MASK;
}

static inline void gred_load_wred_set(const struct gred_sched *table,
                                      struct gred_sched_data *q)
{
        q->vars.qavg = table->wred_set.qavg;
        q->vars.qidlestart = table->wred_set.qidlestart;
}

static inline void gred_store_wred_set(struct gred_sched *table,
                                       struct gred_sched_data *q)
{
        table->wred_set.qavg = q->vars.qavg;
        table->wred_set.qidlestart = q->vars.qidlestart;
}

static int gred_use_ecn(struct gred_sched_data *q)
{
        return q->red_flags & TC_RED_ECN;
}

static int gred_use_harddrop(struct gred_sched_data *q)
{
        return q->red_flags & TC_RED_HARDDROP;
}

static bool gred_per_vq_red_flags_used(struct gred_sched *table)
{
        unsigned int i;

        /* Local per-vq flags couldn't have been set unless global are 0 */
        if (table->red_flags)
                return false;
        for (i = 0; i < MAX_DPs; i++)
                if (table->tab[i] && table->tab[i]->red_flags)
                        return true;
        return false;
}
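
/* Enqueue path: map the packet to a virtual queue via skb->tc_index (falling
 * back to the default DP), update the per-VQ or shared WRED average queue
 * length, and let red_action() decide between queueing, ECN marking and
 * dropping.
 */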
static int gred_enqueue(struct sk_buff *skb, struct Qdisc *sch,
                        struct sk_buff **to_free)
{
        struct gred_sched_data *q = NULL;
        struct gred_sched *t = qdisc_priv(sch);
        unsigned long qavg = 0;
        u16 dp = tc_index_to_dp(skb);

        if (dp >= t->DPs || (q = t->tab[dp]) == NULL) {
                dp = t->def;
                q = t->tab[dp];
                if (!q) {
                        /* Pass through packets not assigned to a DP
                         * if no default DP has been configured. This
                         * allows for DP flows to be left untouched.
                         */
                        if (likely(sch->qstats.backlog + qdisc_pkt_len(skb) <=
                                        sch->limit))
                                return qdisc_enqueue_tail(skb, sch);
                        else
                                goto drop;
                }

                /* fix tc_index? --could be controversial but needed for
                   requeueing */
                skb->tc_index = (skb->tc_index & ~GRED_VQ_MASK) | dp;
        }

        /* sum up all the qaves of prios < ours to get the new qave */
        if (!gred_wred_mode(t) && gred_rio_mode(t)) {
                int i;

                for (i = 0; i < t->DPs; i++) {
                        if (t->tab[i] && t->tab[i]->prio < q->prio &&
                            !red_is_idling(&t->tab[i]->vars))
                                qavg += t->tab[i]->vars.qavg;
                }

        }

        q->packetsin++;
        q->bytesin += qdisc_pkt_len(skb);

        if (gred_wred_mode(t))
                gred_load_wred_set(t, q);

        q->vars.qavg = red_calc_qavg(&q->parms,
                                     &q->vars,
                                     gred_backlog(t, q, sch));

        if (red_is_idling(&q->vars))
                red_end_of_idle_period(&q->vars);

        if (gred_wred_mode(t))
                gred_store_wred_set(t, q);

        switch (red_action(&q->parms, &q->vars, q->vars.qavg + qavg)) {
        case RED_DONT_MARK:
                break;

        case RED_PROB_MARK:
                qdisc_qstats_overlimit(sch);
                if (!gred_use_ecn(q) || !INET_ECN_set_ce(skb)) {
                        q->stats.prob_drop++;
                        goto congestion_drop;
                }

                q->stats.prob_mark++;
                break;

        case RED_HARD_MARK:
                qdisc_qstats_overlimit(sch);
                if (gred_use_harddrop(q) || !gred_use_ecn(q) ||
                    !INET_ECN_set_ce(skb)) {
                        q->stats.forced_drop++;
                        goto congestion_drop;
                }

                q->stats.forced_mark++;
                break;
        }

        if (gred_backlog(t, q, sch) + qdisc_pkt_len(skb) <= q->limit) {
                q->backlog += qdisc_pkt_len(skb);
                return qdisc_enqueue_tail(skb, sch);
        }

        q->stats.pdrop++;
drop:
        return qdisc_drop(skb, sch, to_free);

congestion_drop:
        qdisc_drop(skb, sch, to_free);
        return NET_XMIT_CN;
}
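
/* Dequeue from the shared FIFO, account the packet against its virtual queue
 * and start the RED idle period once the relevant backlog drains.
 */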
static struct sk_buff *gred_dequeue(struct Qdisc *sch)
{
        struct sk_buff *skb;
        struct gred_sched *t = qdisc_priv(sch);

        skb = qdisc_dequeue_head(sch);

        if (skb) {
                struct gred_sched_data *q;
                u16 dp = tc_index_to_dp(skb);

                if (dp >= t->DPs || (q = t->tab[dp]) == NULL) {
                        net_warn_ratelimited("GRED: Unable to relocate VQ 0x%x after dequeue, screwing up backlog\n",
                                             tc_index_to_dp(skb));
                } else {
                        q->backlog -= qdisc_pkt_len(skb);

                        if (gred_wred_mode(t)) {
                                if (!sch->qstats.backlog)
                                        red_start_of_idle_period(&t->wred_set);
                        } else {
                                if (!q->backlog)
                                        red_start_of_idle_period(&q->vars);
                        }
                }

                return skb;
        }

        return NULL;
}

static void gred_reset(struct Qdisc *sch)
{
        int i;
        struct gred_sched *t = qdisc_priv(sch);

        qdisc_reset_queue(sch);

        for (i = 0; i < t->DPs; i++) {
                struct gred_sched_data *q = t->tab[i];

                if (!q)
                        continue;
                red_restart(&q->vars);
                q->backlog = 0;
        }
}

static void gred_offload(struct Qdisc *sch, enum tc_gred_command command)
{
        struct gred_sched *table = qdisc_priv(sch);
        struct net_device *dev = qdisc_dev(sch);
        struct tc_gred_qopt_offload *opt = table->opt;

        if (!tc_can_offload(dev) || !dev->netdev_ops->ndo_setup_tc)
                return;

        memset(opt, 0, sizeof(*opt));
        opt->command = command;
        opt->handle = sch->handle;
        opt->parent = sch->parent;

        if (command == TC_GRED_REPLACE) {
                unsigned int i;

                opt->set.grio_on = gred_rio_mode(table);
                opt->set.wred_on = gred_wred_mode(table);
                opt->set.dp_cnt = table->DPs;
                opt->set.dp_def = table->def;

                for (i = 0; i < table->DPs; i++) {
                        struct gred_sched_data *q = table->tab[i];

                        if (!q)
                                continue;
                        opt->set.tab[i].present = true;
                        opt->set.tab[i].limit = q->limit;
                        opt->set.tab[i].prio = q->prio;
                        opt->set.tab[i].min = q->parms.qth_min >> q->parms.Wlog;
                        opt->set.tab[i].max = q->parms.qth_max >> q->parms.Wlog;
                        opt->set.tab[i].is_ecn = gred_use_ecn(q);
                        opt->set.tab[i].is_harddrop = gred_use_harddrop(q);
                        opt->set.tab[i].probability = q->parms.max_P;
                        opt->set.tab[i].backlog = &q->backlog;
                }

                opt->set.qstats = &sch->qstats;
        }

        dev->netdev_ops->ndo_setup_tc(dev, TC_SETUP_QDISC_GRED, opt);
}
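
/* Pull per-VQ counters back from the offloading driver and fold them into
 * the software statistics, so a dump also reflects hardware-handled traffic.
 */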
static int gred_offload_dump_stats(struct Qdisc *sch)
{
        struct gred_sched *table = qdisc_priv(sch);
        struct tc_gred_qopt_offload *hw_stats;
        u64 bytes = 0, packets = 0;
        unsigned int i;
        int ret;

        hw_stats = kzalloc(sizeof(*hw_stats), GFP_KERNEL);
        if (!hw_stats)
                return -ENOMEM;

        hw_stats->command = TC_GRED_STATS;
        hw_stats->handle = sch->handle;
        hw_stats->parent = sch->parent;

        for (i = 0; i < MAX_DPs; i++) {
                gnet_stats_basic_sync_init(&hw_stats->stats.bstats[i]);
                if (table->tab[i])
                        hw_stats->stats.xstats[i] = &table->tab[i]->stats;
        }

        ret = qdisc_offload_dump_helper(sch, TC_SETUP_QDISC_GRED, hw_stats);
        /* Even if driver returns failure adjust the stats - in case offload
         * ended but driver still wants to adjust the values.
         */
        sch_tree_lock(sch);
        for (i = 0; i < MAX_DPs; i++) {
                if (!table->tab[i])
                        continue;
                table->tab[i]->packetsin += u64_stats_read(&hw_stats->stats.bstats[i].packets);
                table->tab[i]->bytesin += u64_stats_read(&hw_stats->stats.bstats[i].bytes);
                table->tab[i]->backlog += hw_stats->stats.qstats[i].backlog;

                bytes += u64_stats_read(&hw_stats->stats.bstats[i].bytes);
                packets += u64_stats_read(&hw_stats->stats.bstats[i].packets);
                sch->qstats.qlen += hw_stats->stats.qstats[i].qlen;
                sch->qstats.backlog += hw_stats->stats.qstats[i].backlog;
                sch->qstats.drops += hw_stats->stats.qstats[i].drops;
                sch->qstats.requeues += hw_stats->stats.qstats[i].requeues;
                sch->qstats.overlimits += hw_stats->stats.qstats[i].overlimits;
        }
        _bstats_update(&sch->bstats, bytes, packets);

        sch_tree_unlock(sch);

        kfree(hw_stats);
        return ret;
}

static inline void gred_destroy_vq(struct gred_sched_data *q)
{
        kfree(q);
}
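
/* Handle the table-level part of a change request (TCA_GRED_DPS): number of
 * virtual queues, default DP, grio/wred operating mode and Qdisc-level RED
 * flags. Virtual queues beyond the new DP count are destroyed.
 */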
static int gred_change_table_def(struct Qdisc *sch, struct nlattr *dps,
                                 struct netlink_ext_ack *extack)
{
        struct gred_sched *table = qdisc_priv(sch);
        struct tc_gred_sopt *sopt;
        bool red_flags_changed;
        int i;

        if (!dps)
                return -EINVAL;

        sopt = nla_data(dps);

        if (sopt->DPs > MAX_DPs) {
                NL_SET_ERR_MSG_MOD(extack, "number of virtual queues too high");
                return -EINVAL;
        }
        if (sopt->DPs == 0) {
                NL_SET_ERR_MSG_MOD(extack,
                                   "number of virtual queues can't be 0");
                return -EINVAL;
        }
        if (sopt->def_DP >= sopt->DPs) {
                NL_SET_ERR_MSG_MOD(extack, "default virtual queue above virtual queue count");
                return -EINVAL;
        }
        if (sopt->flags && gred_per_vq_red_flags_used(table)) {
                NL_SET_ERR_MSG_MOD(extack, "can't set per-Qdisc RED flags when per-virtual queue flags are used");
                return -EINVAL;
        }

        sch_tree_lock(sch);
        table->DPs = sopt->DPs;
        table->def = sopt->def_DP;
        red_flags_changed = table->red_flags != sopt->flags;
        table->red_flags = sopt->flags;

        /*
         * Every entry point to GRED is synchronized with the above code
         * and the DP is checked against DPs, i.e. shadowed VQs can no
         * longer be found so we can unlock right here.
         */
        sch_tree_unlock(sch);

        if (sopt->grio) {
                gred_enable_rio_mode(table);
                gred_disable_wred_mode(table);
                if (gred_wred_mode_check(sch))
                        gred_enable_wred_mode(table);
        } else {
                gred_disable_rio_mode(table);
                gred_disable_wred_mode(table);
        }

        if (red_flags_changed)
                for (i = 0; i < table->DPs; i++)
                        if (table->tab[i])
                                table->tab[i]->red_flags =
                                        table->red_flags & GRED_VQ_RED_FLAGS;

        for (i = table->DPs; i < MAX_DPs; i++) {
                if (table->tab[i]) {
                        pr_warn("GRED: Warning: Destroying shadowed VQ 0x%x\n",
                                i);
                        gred_destroy_vq(table->tab[i]);
                        table->tab[i] = NULL;
                }
        }

        gred_offload(sch, TC_GRED_REPLACE);
        return 0;
}
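
/* Apply RED parameters to one virtual queue, allocating it from *prealloc if
 * it does not exist yet. Called under sch_tree_lock() by gred_change().
 */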
static inline int gred_change_vq(struct Qdisc *sch, int dp,
                                 struct tc_gred_qopt *ctl, int prio,
                                 u8 *stab, u32 max_P,
                                 struct gred_sched_data **prealloc,
                                 struct netlink_ext_ack *extack)
{
        struct gred_sched *table = qdisc_priv(sch);
        struct gred_sched_data *q = table->tab[dp];

        if (!red_check_params(ctl->qth_min, ctl->qth_max, ctl->Wlog, ctl->Scell_log, stab)) {
                NL_SET_ERR_MSG_MOD(extack, "invalid RED parameters");
                return -EINVAL;
        }

        if (!q) {
                table->tab[dp] = q = *prealloc;
                *prealloc = NULL;
                if (!q)
                        return -ENOMEM;
                q->red_flags = table->red_flags & GRED_VQ_RED_FLAGS;
        }

        q->DP = dp;
        q->prio = prio;
        if (ctl->limit > sch->limit)
                q->limit = sch->limit;
        else
                q->limit = ctl->limit;

        if (q->backlog == 0)
                red_end_of_idle_period(&q->vars);

        red_set_parms(&q->parms,
                      ctl->qth_min, ctl->qth_max, ctl->Wlog, ctl->Plog,
                      ctl->Scell_log, stab, max_P);
        red_set_vars(&q->vars);
        return 0;
}

static const struct nla_policy gred_vq_policy[TCA_GRED_VQ_MAX + 1] = {
        [TCA_GRED_VQ_DP]	= { .type = NLA_U32 },
        [TCA_GRED_VQ_FLAGS]	= { .type = NLA_U32 },
};

static const struct nla_policy gred_vqe_policy[TCA_GRED_VQ_ENTRY_MAX + 1] = {
        [TCA_GRED_VQ_ENTRY]	= { .type = NLA_NESTED },
};

static const struct nla_policy gred_policy[TCA_GRED_MAX + 1] = {
        [TCA_GRED_PARMS]	= { .len = sizeof(struct tc_gred_qopt) },
        [TCA_GRED_STAB]		= { .len = 256 },
        [TCA_GRED_DPS]		= { .len = sizeof(struct tc_gred_sopt) },
        [TCA_GRED_MAX_P]	= { .type = NLA_U32 },
        [TCA_GRED_LIMIT]	= { .type = NLA_U32 },
        [TCA_GRED_VQ_LIST]	= { .type = NLA_NESTED },
};

static void gred_vq_apply(struct gred_sched *table, const struct nlattr *entry)
{
        struct nlattr *tb[TCA_GRED_VQ_MAX + 1];
        u32 dp;

        nla_parse_nested_deprecated(tb, TCA_GRED_VQ_MAX, entry,
                                    gred_vq_policy, NULL);

        dp = nla_get_u32(tb[TCA_GRED_VQ_DP]);

        if (tb[TCA_GRED_VQ_FLAGS])
                table->tab[dp]->red_flags = nla_get_u32(tb[TCA_GRED_VQ_FLAGS]);
}

static void gred_vqs_apply(struct gred_sched *table, struct nlattr *vqs)
{
        const struct nlattr *attr;
        int rem;

        nla_for_each_nested(attr, vqs, rem) {
                switch (nla_type(attr)) {
                case TCA_GRED_VQ_ENTRY:
                        gred_vq_apply(table, attr);
                        break;
                }
        }
}

static int gred_vq_validate(struct gred_sched *table, u32 cdp,
                            const struct nlattr *entry,
                            struct netlink_ext_ack *extack)
{
        struct nlattr *tb[TCA_GRED_VQ_MAX + 1];
        int err;
        u32 dp;

        err = nla_parse_nested_deprecated(tb, TCA_GRED_VQ_MAX, entry,
                                          gred_vq_policy, extack);
        if (err < 0)
                return err;

        if (!tb[TCA_GRED_VQ_DP]) {
                NL_SET_ERR_MSG_MOD(extack, "Virtual queue with no index specified");
                return -EINVAL;
        }
        dp = nla_get_u32(tb[TCA_GRED_VQ_DP]);
        if (dp >= table->DPs) {
                NL_SET_ERR_MSG_MOD(extack, "Virtual queue with index out of bounds");
                return -EINVAL;
        }
        if (dp != cdp && !table->tab[dp]) {
                NL_SET_ERR_MSG_MOD(extack, "Virtual queue not yet instantiated");
                return -EINVAL;
        }

        if (tb[TCA_GRED_VQ_FLAGS]) {
                u32 red_flags = nla_get_u32(tb[TCA_GRED_VQ_FLAGS]);

                if (table->red_flags && table->red_flags != red_flags) {
                        NL_SET_ERR_MSG_MOD(extack, "can't change per-virtual queue RED flags when per-Qdisc flags are used");
                        return -EINVAL;
                }
                if (red_flags & ~GRED_VQ_RED_FLAGS) {
                        NL_SET_ERR_MSG_MOD(extack,
                                           "invalid RED flags specified");
                        return -EINVAL;
                }
        }

        return 0;
}

static int gred_vqs_validate(struct gred_sched *table, u32 cdp,
                             struct nlattr *vqs, struct netlink_ext_ack *extack)
{
        const struct nlattr *attr;
        int rem, err;

        err = nla_validate_nested_deprecated(vqs, TCA_GRED_VQ_ENTRY_MAX,
                                             gred_vqe_policy, extack);
        if (err < 0)
                return err;

        nla_for_each_nested(attr, vqs, rem) {
                switch (nla_type(attr)) {
                case TCA_GRED_VQ_ENTRY:
                        err = gred_vq_validate(table, cdp, attr, extack);
                        if (err)
                                return err;
                        break;
                default:
                        NL_SET_ERR_MSG_MOD(extack, "GRED_VQ_LIST can contain only entry attributes");
                        return -EINVAL;
                }
        }

        if (rem > 0) {
                NL_SET_ERR_MSG_MOD(extack, "Trailing data after parsing virtual queue list");
                return -EINVAL;
        }

        return 0;
}
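
/* .change handler: either a table-level update (TCA_GRED_DPS, optionally with
 * a new limit) or the configuration of a single virtual queue via
 * TCA_GRED_PARMS/TCA_GRED_STAB, plus the optional structured VQ list.
 */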
static int gred_change(struct Qdisc *sch, struct nlattr *opt,
                       struct netlink_ext_ack *extack)
{
        struct gred_sched *table = qdisc_priv(sch);
        struct tc_gred_qopt *ctl;
        struct nlattr *tb[TCA_GRED_MAX + 1];
        int err, prio = GRED_DEF_PRIO;
        u8 *stab;
        u32 max_P;
        struct gred_sched_data *prealloc;

        err = nla_parse_nested_deprecated(tb, TCA_GRED_MAX, opt, gred_policy,
                                          extack);
        if (err < 0)
                return err;

        if (tb[TCA_GRED_PARMS] == NULL && tb[TCA_GRED_STAB] == NULL) {
                if (tb[TCA_GRED_LIMIT] != NULL)
                        sch->limit = nla_get_u32(tb[TCA_GRED_LIMIT]);
                return gred_change_table_def(sch, tb[TCA_GRED_DPS], extack);
        }

        if (tb[TCA_GRED_PARMS] == NULL ||
            tb[TCA_GRED_STAB] == NULL ||
            tb[TCA_GRED_LIMIT] != NULL) {
                NL_SET_ERR_MSG_MOD(extack, "can't configure Qdisc and virtual queue at the same time");
                return -EINVAL;
        }

        max_P = tb[TCA_GRED_MAX_P] ? nla_get_u32(tb[TCA_GRED_MAX_P]) : 0;

        ctl = nla_data(tb[TCA_GRED_PARMS]);
        stab = nla_data(tb[TCA_GRED_STAB]);

        if (ctl->DP >= table->DPs) {
                NL_SET_ERR_MSG_MOD(extack, "virtual queue index above virtual queue count");
                return -EINVAL;
        }

        if (tb[TCA_GRED_VQ_LIST]) {
                err = gred_vqs_validate(table, ctl->DP, tb[TCA_GRED_VQ_LIST],
                                        extack);
                if (err)
                        return err;
        }

        if (gred_rio_mode(table)) {
                if (ctl->prio == 0) {
                        int def_prio = GRED_DEF_PRIO;

                        if (table->tab[table->def])
                                def_prio = table->tab[table->def]->prio;

                        printk(KERN_DEBUG "GRED: DP %u does not have a prio "
                               "setting default to %d\n", ctl->DP, def_prio);

                        prio = def_prio;
                } else
                        prio = ctl->prio;
        }

        prealloc = kzalloc(sizeof(*prealloc), GFP_KERNEL);
        sch_tree_lock(sch);

        err = gred_change_vq(sch, ctl->DP, ctl, prio, stab, max_P, &prealloc,
                             extack);
        if (err < 0)
                goto err_unlock_free;

        if (tb[TCA_GRED_VQ_LIST])
                gred_vqs_apply(table, tb[TCA_GRED_VQ_LIST]);

        if (gred_rio_mode(table)) {
                gred_disable_wred_mode(table);
                if (gred_wred_mode_check(sch))
                        gred_enable_wred_mode(table);
        }

        sch_tree_unlock(sch);
        kfree(prealloc);

        gred_offload(sch, TC_GRED_REPLACE);
        return 0;

err_unlock_free:
        sch_tree_unlock(sch);
        kfree(prealloc);
        return err;
}
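
/* .init handler: only table-level attributes are accepted here; individual
 * virtual queues are configured later through gred_change().
 */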
static int gred_init(struct Qdisc *sch, struct nlattr *opt,
                     struct netlink_ext_ack *extack)
{
        struct gred_sched *table = qdisc_priv(sch);
        struct nlattr *tb[TCA_GRED_MAX + 1];
        int err;

        if (!opt)
                return -EINVAL;

        err = nla_parse_nested_deprecated(tb, TCA_GRED_MAX, opt, gred_policy,
                                          extack);
        if (err < 0)
                return err;

        if (tb[TCA_GRED_PARMS] || tb[TCA_GRED_STAB]) {
                NL_SET_ERR_MSG_MOD(extack,
                                   "virtual queue configuration can't be specified at initialization time");
                return -EINVAL;
        }

        if (tb[TCA_GRED_LIMIT])
                sch->limit = nla_get_u32(tb[TCA_GRED_LIMIT]);
        else
                sch->limit = qdisc_dev(sch)->tx_queue_len
                             * psched_mtu(qdisc_dev(sch));

        if (qdisc_dev(sch)->netdev_ops->ndo_setup_tc) {
                table->opt = kzalloc(sizeof(*table->opt), GFP_KERNEL);
                if (!table->opt)
                        return -ENOMEM;
        }

        return gred_change_table_def(sch, tb[TCA_GRED_DPS], extack);
}
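
/* Dump both the legacy all-in-one TCA_GRED_PARMS array and the newer
 * structured TCA_GRED_VQ_LIST, after refreshing counters from the offload.
 */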
static int gred_dump(struct Qdisc *sch, struct sk_buff *skb)
{
        struct gred_sched *table = qdisc_priv(sch);
        struct nlattr *parms, *vqs, *opts = NULL;
        int i;
        u32 max_p[MAX_DPs];
        struct tc_gred_sopt sopt = {
                .DPs	= table->DPs,
                .def_DP	= table->def,
                .grio	= gred_rio_mode(table),
                .flags	= table->red_flags,
        };

        if (gred_offload_dump_stats(sch))
                goto nla_put_failure;

        opts = nla_nest_start_noflag(skb, TCA_OPTIONS);
        if (opts == NULL)
                goto nla_put_failure;
        if (nla_put(skb, TCA_GRED_DPS, sizeof(sopt), &sopt))
                goto nla_put_failure;

        for (i = 0; i < MAX_DPs; i++) {
                struct gred_sched_data *q = table->tab[i];

                max_p[i] = q ? q->parms.max_P : 0;
        }
        if (nla_put(skb, TCA_GRED_MAX_P, sizeof(max_p), max_p))
                goto nla_put_failure;

        if (nla_put_u32(skb, TCA_GRED_LIMIT, sch->limit))
                goto nla_put_failure;

        /* Old style all-in-one dump of VQs */
        parms = nla_nest_start_noflag(skb, TCA_GRED_PARMS);
        if (parms == NULL)
                goto nla_put_failure;

        for (i = 0; i < MAX_DPs; i++) {
                struct gred_sched_data *q = table->tab[i];
                struct tc_gred_qopt opt;
                unsigned long qavg;

                memset(&opt, 0, sizeof(opt));

                if (!q) {
                        /* hack -- fix at some point with proper message
                           This is how we indicate to tc that there is no VQ
                           at this DP */
                        opt.DP = MAX_DPs + i;
                        goto append_opt;
                }

                opt.limit	= q->limit;
                opt.DP		= q->DP;
                opt.backlog	= gred_backlog(table, q, sch);
                opt.prio	= q->prio;
                opt.qth_min	= q->parms.qth_min >> q->parms.Wlog;
                opt.qth_max	= q->parms.qth_max >> q->parms.Wlog;
                opt.Wlog	= q->parms.Wlog;
                opt.Plog	= q->parms.Plog;
                opt.Scell_log	= q->parms.Scell_log;
                opt.early	= q->stats.prob_drop;
                opt.forced	= q->stats.forced_drop;
                opt.pdrop	= q->stats.pdrop;
                opt.packets	= q->packetsin;
                opt.bytesin	= q->bytesin;

                if (gred_wred_mode(table))
                        gred_load_wred_set(table, q);

                qavg = red_calc_qavg(&q->parms, &q->vars,
                                     q->vars.qavg >> q->parms.Wlog);
                opt.qave = qavg >> q->parms.Wlog;

append_opt:
                if (nla_append(skb, sizeof(opt), &opt) < 0)
                        goto nla_put_failure;
        }

        nla_nest_end(skb, parms);

        /* Dump the VQs again, in more structured way */
        vqs = nla_nest_start_noflag(skb, TCA_GRED_VQ_LIST);
        if (!vqs)
                goto nla_put_failure;

        for (i = 0; i < MAX_DPs; i++) {
                struct gred_sched_data *q = table->tab[i];
                struct nlattr *vq;

                if (!q)
                        continue;

                vq = nla_nest_start_noflag(skb, TCA_GRED_VQ_ENTRY);
                if (!vq)
                        goto nla_put_failure;

                if (nla_put_u32(skb, TCA_GRED_VQ_DP, q->DP))
                        goto nla_put_failure;

                if (nla_put_u32(skb, TCA_GRED_VQ_FLAGS, q->red_flags))
                        goto nla_put_failure;

                /* Stats */
                if (nla_put_u64_64bit(skb, TCA_GRED_VQ_STAT_BYTES, q->bytesin,
                                      TCA_GRED_VQ_PAD))
                        goto nla_put_failure;
                if (nla_put_u32(skb, TCA_GRED_VQ_STAT_PACKETS, q->packetsin))
                        goto nla_put_failure;
                if (nla_put_u32(skb, TCA_GRED_VQ_STAT_BACKLOG,
                                gred_backlog(table, q, sch)))
                        goto nla_put_failure;
                if (nla_put_u32(skb, TCA_GRED_VQ_STAT_PROB_DROP,
                                q->stats.prob_drop))
                        goto nla_put_failure;
                if (nla_put_u32(skb, TCA_GRED_VQ_STAT_PROB_MARK,
                                q->stats.prob_mark))
                        goto nla_put_failure;
                if (nla_put_u32(skb, TCA_GRED_VQ_STAT_FORCED_DROP,
                                q->stats.forced_drop))
                        goto nla_put_failure;
                if (nla_put_u32(skb, TCA_GRED_VQ_STAT_FORCED_MARK,
                                q->stats.forced_mark))
                        goto nla_put_failure;
                if (nla_put_u32(skb, TCA_GRED_VQ_STAT_PDROP, q->stats.pdrop))
                        goto nla_put_failure;

                nla_nest_end(skb, vq);
        }
        nla_nest_end(skb, vqs);

        return nla_nest_end(skb, opts);

nla_put_failure:
        nla_nest_cancel(skb, opts);
        return -EMSGSIZE;
}

static void gred_destroy(struct Qdisc *sch)
{
        struct gred_sched *table = qdisc_priv(sch);
        int i;

        for (i = 0; i < table->DPs; i++)
                gred_destroy_vq(table->tab[i]);

        gred_offload(sch, TC_GRED_DESTROY);
        kfree(table->opt);
}

static struct Qdisc_ops gred_qdisc_ops __read_mostly = {
        .id		=	"gred",
        .priv_size	=	sizeof(struct gred_sched),
        .enqueue	=	gred_enqueue,
        .dequeue	=	gred_dequeue,
        .peek		=	qdisc_peek_head,
        .init		=	gred_init,
        .reset		=	gred_reset,
        .destroy	=	gred_destroy,
        .change		=	gred_change,
        .dump		=	gred_dump,
        .owner		=	THIS_MODULE,
};

static int __init gred_module_init(void)
{
        return register_qdisc(&gred_qdisc_ops);
}

static void __exit gred_module_exit(void)
{
        unregister_qdisc(&gred_qdisc_ops);
}

module_init(gred_module_init)
module_exit(gred_module_exit)

MODULE_LICENSE("GPL");