group.c 24 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634635636637638639640641642643644645646647648649650651652653654655656657658659660661662663664665666667668669670671672673674675676677678679680681682683684685686687688689690691692693694695696697698699700701702703704705706707708709710711712713714715716717718719720721722723724725726727728729730731732733734735736737738739740741742743744745746747748749750751752753754755756757758759760761762763764765766767768769770771772773774775776777778779780781782783784785786787788789790791792793794795796797798799800801802803804805806807808809810811812813814815816817818819820821822823824825826827828829830831832833834835836837838839840841842843844845846847848849850851852853854855856857858859860861862863864865866867868869870871872873874875876877878879880881882883884885886887888889890891892893894895896897898899900901902903904905906907908909910911912913914915916917918919920921922923924925926927928929930931932933934935936937938939940941942943944945946947948949950951952953954955956957958959
  1. /*
  2. * net/tipc/group.c: TIPC group messaging code
  3. *
  4. * Copyright (c) 2017, Ericsson AB
  5. * Copyright (c) 2020, Red Hat Inc
  6. * All rights reserved.
  7. *
  8. * Redistribution and use in source and binary forms, with or without
  9. * modification, are permitted provided that the following conditions are met:
  10. *
  11. * 1. Redistributions of source code must retain the above copyright
  12. * notice, this list of conditions and the following disclaimer.
  13. * 2. Redistributions in binary form must reproduce the above copyright
  14. * notice, this list of conditions and the following disclaimer in the
  15. * documentation and/or other materials provided with the distribution.
  16. * 3. Neither the names of the copyright holders nor the names of its
  17. * contributors may be used to endorse or promote products derived from
  18. * this software without specific prior written permission.
  19. *
  20. * Alternatively, this software may be distributed under the terms of the
  21. * GNU General Public License ("GPL") version 2 as published by the Free
  22. * Software Foundation.
  23. *
  24. * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
  25. * AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
  26. * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
  27. * ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
  28. * LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
  29. * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
  30. * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
  31. * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
  32. * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
  33. * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
  34. * POSSIBILITY OF SUCH DAMAGE.
  35. */
  36. #include "core.h"
  37. #include "addr.h"
  38. #include "group.h"
  39. #include "bcast.h"
  40. #include "topsrv.h"
  41. #include "msg.h"
  42. #include "socket.h"
  43. #include "node.h"
  44. #include "name_table.h"
  45. #include "subscr.h"
  46. #define ADV_UNIT (((MAX_MSG_SIZE + MAX_H_SIZE) / FLOWCTL_BLK_SZ) + 1)
  47. #define ADV_IDLE ADV_UNIT
  48. #define ADV_ACTIVE (ADV_UNIT * 12)
  49. enum mbr_state {
  50. MBR_JOINING,
  51. MBR_PUBLISHED,
  52. MBR_JOINED,
  53. MBR_PENDING,
  54. MBR_ACTIVE,
  55. MBR_RECLAIMING,
  56. MBR_REMITTED,
  57. MBR_LEAVING
  58. };
  59. struct tipc_member {
  60. struct rb_node tree_node;
  61. struct list_head list;
  62. struct list_head small_win;
  63. struct sk_buff_head deferredq;
  64. struct tipc_group *group;
  65. u32 node;
  66. u32 port;
  67. u32 instance;
  68. enum mbr_state state;
  69. u16 advertised;
  70. u16 window;
  71. u16 bc_rcv_nxt;
  72. u16 bc_syncpt;
  73. u16 bc_acked;
  74. };
  75. struct tipc_group {
  76. struct rb_root members;
  77. struct list_head small_win;
  78. struct list_head pending;
  79. struct list_head active;
  80. struct tipc_nlist dests;
  81. struct net *net;
  82. int subid;
  83. u32 type;
  84. u32 instance;
  85. u32 scope;
  86. u32 portid;
  87. u16 member_cnt;
  88. u16 active_cnt;
  89. u16 max_active;
  90. u16 bc_snd_nxt;
  91. u16 bc_ackers;
  92. bool *open;
  93. bool loopback;
  94. bool events;
  95. };
  96. static void tipc_group_proto_xmit(struct tipc_group *grp, struct tipc_member *m,
  97. int mtyp, struct sk_buff_head *xmitq);
  98. static void tipc_group_open(struct tipc_member *m, bool *wakeup)
  99. {
  100. *wakeup = false;
  101. if (list_empty(&m->small_win))
  102. return;
  103. list_del_init(&m->small_win);
  104. *m->group->open = true;
  105. *wakeup = true;
  106. }
  107. static void tipc_group_decr_active(struct tipc_group *grp,
  108. struct tipc_member *m)
  109. {
  110. if (m->state == MBR_ACTIVE || m->state == MBR_RECLAIMING ||
  111. m->state == MBR_REMITTED)
  112. grp->active_cnt--;
  113. }
  114. static int tipc_group_rcvbuf_limit(struct tipc_group *grp)
  115. {
  116. int max_active, active_pool, idle_pool;
  117. int mcnt = grp->member_cnt + 1;
  118. /* Limit simultaneous reception from other members */
  119. max_active = min(mcnt / 8, 64);
  120. max_active = max(max_active, 16);
  121. grp->max_active = max_active;
  122. /* Reserve blocks for active and idle members */
  123. active_pool = max_active * ADV_ACTIVE;
  124. idle_pool = (mcnt - max_active) * ADV_IDLE;
  125. /* Scale to bytes, considering worst-case truesize/msgsize ratio */
  126. return (active_pool + idle_pool) * FLOWCTL_BLK_SZ * 4;
  127. }
  128. u16 tipc_group_bc_snd_nxt(struct tipc_group *grp)
  129. {
  130. return grp->bc_snd_nxt;
  131. }
  132. static bool tipc_group_is_receiver(struct tipc_member *m)
  133. {
  134. return m && m->state != MBR_JOINING && m->state != MBR_LEAVING;
  135. }
  136. static bool tipc_group_is_sender(struct tipc_member *m)
  137. {
  138. return m && m->state != MBR_JOINING && m->state != MBR_PUBLISHED;
  139. }
  140. u32 tipc_group_exclude(struct tipc_group *grp)
  141. {
  142. if (!grp->loopback)
  143. return grp->portid;
  144. return 0;
  145. }
  146. struct tipc_group *tipc_group_create(struct net *net, u32 portid,
  147. struct tipc_group_req *mreq,
  148. bool *group_is_open)
  149. {
  150. u32 filter = TIPC_SUB_PORTS | TIPC_SUB_NO_STATUS;
  151. bool global = mreq->scope != TIPC_NODE_SCOPE;
  152. struct tipc_group *grp;
  153. u32 type = mreq->type;
  154. grp = kzalloc(sizeof(*grp), GFP_ATOMIC);
  155. if (!grp)
  156. return NULL;
  157. tipc_nlist_init(&grp->dests, tipc_own_addr(net));
  158. INIT_LIST_HEAD(&grp->small_win);
  159. INIT_LIST_HEAD(&grp->active);
  160. INIT_LIST_HEAD(&grp->pending);
  161. grp->members = RB_ROOT;
  162. grp->net = net;
  163. grp->portid = portid;
  164. grp->type = type;
  165. grp->instance = mreq->instance;
  166. grp->scope = mreq->scope;
  167. grp->loopback = mreq->flags & TIPC_GROUP_LOOPBACK;
  168. grp->events = mreq->flags & TIPC_GROUP_MEMBER_EVTS;
  169. grp->open = group_is_open;
  170. *grp->open = false;
  171. filter |= global ? TIPC_SUB_CLUSTER_SCOPE : TIPC_SUB_NODE_SCOPE;
  172. if (tipc_topsrv_kern_subscr(net, portid, type, 0, ~0,
  173. filter, &grp->subid))
  174. return grp;
  175. kfree(grp);
  176. return NULL;
  177. }
  178. void tipc_group_join(struct net *net, struct tipc_group *grp, int *sk_rcvbuf)
  179. {
  180. struct rb_root *tree = &grp->members;
  181. struct tipc_member *m, *tmp;
  182. struct sk_buff_head xmitq;
  183. __skb_queue_head_init(&xmitq);
  184. rbtree_postorder_for_each_entry_safe(m, tmp, tree, tree_node) {
  185. tipc_group_proto_xmit(grp, m, GRP_JOIN_MSG, &xmitq);
  186. tipc_group_update_member(m, 0);
  187. }
  188. tipc_node_distr_xmit(net, &xmitq);
  189. *sk_rcvbuf = tipc_group_rcvbuf_limit(grp);
  190. }
  191. void tipc_group_delete(struct net *net, struct tipc_group *grp)
  192. {
  193. struct rb_root *tree = &grp->members;
  194. struct tipc_member *m, *tmp;
  195. struct sk_buff_head xmitq;
  196. __skb_queue_head_init(&xmitq);
  197. rbtree_postorder_for_each_entry_safe(m, tmp, tree, tree_node) {
  198. tipc_group_proto_xmit(grp, m, GRP_LEAVE_MSG, &xmitq);
  199. __skb_queue_purge(&m->deferredq);
  200. list_del(&m->list);
  201. kfree(m);
  202. }
  203. tipc_node_distr_xmit(net, &xmitq);
  204. tipc_nlist_purge(&grp->dests);
  205. tipc_topsrv_kern_unsubscr(net, grp->subid);
  206. kfree(grp);
  207. }
  208. static struct tipc_member *tipc_group_find_member(struct tipc_group *grp,
  209. u32 node, u32 port)
  210. {
  211. struct rb_node *n = grp->members.rb_node;
  212. u64 nkey, key = (u64)node << 32 | port;
  213. struct tipc_member *m;
  214. while (n) {
  215. m = container_of(n, struct tipc_member, tree_node);
  216. nkey = (u64)m->node << 32 | m->port;
  217. if (key < nkey)
  218. n = n->rb_left;
  219. else if (key > nkey)
  220. n = n->rb_right;
  221. else
  222. return m;
  223. }
  224. return NULL;
  225. }
  226. static struct tipc_member *tipc_group_find_dest(struct tipc_group *grp,
  227. u32 node, u32 port)
  228. {
  229. struct tipc_member *m;
  230. m = tipc_group_find_member(grp, node, port);
  231. if (m && tipc_group_is_receiver(m))
  232. return m;
  233. return NULL;
  234. }
  235. static struct tipc_member *tipc_group_find_node(struct tipc_group *grp,
  236. u32 node)
  237. {
  238. struct tipc_member *m;
  239. struct rb_node *n;
  240. for (n = rb_first(&grp->members); n; n = rb_next(n)) {
  241. m = container_of(n, struct tipc_member, tree_node);
  242. if (m->node == node)
  243. return m;
  244. }
  245. return NULL;
  246. }
  247. static int tipc_group_add_to_tree(struct tipc_group *grp,
  248. struct tipc_member *m)
  249. {
  250. u64 nkey, key = (u64)m->node << 32 | m->port;
  251. struct rb_node **n, *parent = NULL;
  252. struct tipc_member *tmp;
  253. n = &grp->members.rb_node;
  254. while (*n) {
  255. tmp = container_of(*n, struct tipc_member, tree_node);
  256. parent = *n;
  257. tmp = container_of(parent, struct tipc_member, tree_node);
  258. nkey = (u64)tmp->node << 32 | tmp->port;
  259. if (key < nkey)
  260. n = &(*n)->rb_left;
  261. else if (key > nkey)
  262. n = &(*n)->rb_right;
  263. else
  264. return -EEXIST;
  265. }
  266. rb_link_node(&m->tree_node, parent, n);
  267. rb_insert_color(&m->tree_node, &grp->members);
  268. return 0;
  269. }
  270. static struct tipc_member *tipc_group_create_member(struct tipc_group *grp,
  271. u32 node, u32 port,
  272. u32 instance, int state)
  273. {
  274. struct tipc_member *m;
  275. int ret;
  276. m = kzalloc(sizeof(*m), GFP_ATOMIC);
  277. if (!m)
  278. return NULL;
  279. INIT_LIST_HEAD(&m->list);
  280. INIT_LIST_HEAD(&m->small_win);
  281. __skb_queue_head_init(&m->deferredq);
  282. m->group = grp;
  283. m->node = node;
  284. m->port = port;
  285. m->instance = instance;
  286. m->bc_acked = grp->bc_snd_nxt - 1;
  287. ret = tipc_group_add_to_tree(grp, m);
  288. if (ret < 0) {
  289. kfree(m);
  290. return NULL;
  291. }
  292. grp->member_cnt++;
  293. tipc_nlist_add(&grp->dests, m->node);
  294. m->state = state;
  295. return m;
  296. }
  297. void tipc_group_add_member(struct tipc_group *grp, u32 node,
  298. u32 port, u32 instance)
  299. {
  300. tipc_group_create_member(grp, node, port, instance, MBR_PUBLISHED);
  301. }
  302. static void tipc_group_delete_member(struct tipc_group *grp,
  303. struct tipc_member *m)
  304. {
  305. rb_erase(&m->tree_node, &grp->members);
  306. grp->member_cnt--;
  307. /* Check if we were waiting for replicast ack from this member */
  308. if (grp->bc_ackers && less(m->bc_acked, grp->bc_snd_nxt - 1))
  309. grp->bc_ackers--;
  310. list_del_init(&m->list);
  311. list_del_init(&m->small_win);
  312. tipc_group_decr_active(grp, m);
  313. /* If last member on a node, remove node from dest list */
  314. if (!tipc_group_find_node(grp, m->node))
  315. tipc_nlist_del(&grp->dests, m->node);
  316. kfree(m);
  317. }
  318. struct tipc_nlist *tipc_group_dests(struct tipc_group *grp)
  319. {
  320. return &grp->dests;
  321. }
  322. void tipc_group_self(struct tipc_group *grp, struct tipc_service_range *seq,
  323. int *scope)
  324. {
  325. seq->type = grp->type;
  326. seq->lower = grp->instance;
  327. seq->upper = grp->instance;
  328. *scope = grp->scope;
  329. }
  330. void tipc_group_update_member(struct tipc_member *m, int len)
  331. {
  332. struct tipc_group *grp = m->group;
  333. struct tipc_member *_m, *tmp;
  334. if (!tipc_group_is_receiver(m))
  335. return;
  336. m->window -= len;
  337. if (m->window >= ADV_IDLE)
  338. return;
  339. list_del_init(&m->small_win);
  340. /* Sort member into small_window members' list */
  341. list_for_each_entry_safe(_m, tmp, &grp->small_win, small_win) {
  342. if (_m->window > m->window)
  343. break;
  344. }
  345. list_add_tail(&m->small_win, &_m->small_win);
  346. }
  347. void tipc_group_update_bc_members(struct tipc_group *grp, int len, bool ack)
  348. {
  349. u16 prev = grp->bc_snd_nxt - 1;
  350. struct tipc_member *m;
  351. struct rb_node *n;
  352. u16 ackers = 0;
  353. for (n = rb_first(&grp->members); n; n = rb_next(n)) {
  354. m = container_of(n, struct tipc_member, tree_node);
  355. if (tipc_group_is_receiver(m)) {
  356. tipc_group_update_member(m, len);
  357. m->bc_acked = prev;
  358. ackers++;
  359. }
  360. }
  361. /* Mark number of acknowledges to expect, if any */
  362. if (ack)
  363. grp->bc_ackers = ackers;
  364. grp->bc_snd_nxt++;
  365. }
  366. bool tipc_group_cong(struct tipc_group *grp, u32 dnode, u32 dport,
  367. int len, struct tipc_member **mbr)
  368. {
  369. struct sk_buff_head xmitq;
  370. struct tipc_member *m;
  371. int adv, state;
  372. m = tipc_group_find_dest(grp, dnode, dport);
  373. if (!tipc_group_is_receiver(m)) {
  374. *mbr = NULL;
  375. return false;
  376. }
  377. *mbr = m;
  378. if (m->window >= len)
  379. return false;
  380. *grp->open = false;
  381. /* If not fully advertised, do it now to prevent mutual blocking */
  382. adv = m->advertised;
  383. state = m->state;
  384. if (state == MBR_JOINED && adv == ADV_IDLE)
  385. return true;
  386. if (state == MBR_ACTIVE && adv == ADV_ACTIVE)
  387. return true;
  388. if (state == MBR_PENDING && adv == ADV_IDLE)
  389. return true;
  390. __skb_queue_head_init(&xmitq);
  391. tipc_group_proto_xmit(grp, m, GRP_ADV_MSG, &xmitq);
  392. tipc_node_distr_xmit(grp->net, &xmitq);
  393. return true;
  394. }
  395. bool tipc_group_bc_cong(struct tipc_group *grp, int len)
  396. {
  397. struct tipc_member *m = NULL;
  398. /* If prev bcast was replicast, reject until all receivers have acked */
  399. if (grp->bc_ackers) {
  400. *grp->open = false;
  401. return true;
  402. }
  403. if (list_empty(&grp->small_win))
  404. return false;
  405. m = list_first_entry(&grp->small_win, struct tipc_member, small_win);
  406. if (m->window >= len)
  407. return false;
  408. return tipc_group_cong(grp, m->node, m->port, len, &m);
  409. }
  410. /* tipc_group_sort_msg() - sort msg into queue by bcast sequence number
  411. */
  412. static void tipc_group_sort_msg(struct sk_buff *skb, struct sk_buff_head *defq)
  413. {
  414. struct tipc_msg *_hdr, *hdr = buf_msg(skb);
  415. u16 bc_seqno = msg_grp_bc_seqno(hdr);
  416. struct sk_buff *_skb, *tmp;
  417. int mtyp = msg_type(hdr);
  418. /* Bcast/mcast may be bypassed by ucast or other bcast, - sort it in */
  419. if (mtyp == TIPC_GRP_BCAST_MSG || mtyp == TIPC_GRP_MCAST_MSG) {
  420. skb_queue_walk_safe(defq, _skb, tmp) {
  421. _hdr = buf_msg(_skb);
  422. if (!less(bc_seqno, msg_grp_bc_seqno(_hdr)))
  423. continue;
  424. __skb_queue_before(defq, _skb, skb);
  425. return;
  426. }
  427. /* Bcast was not bypassed, - add to tail */
  428. }
  429. /* Unicasts are never bypassed, - always add to tail */
  430. __skb_queue_tail(defq, skb);
  431. }
  432. /* tipc_group_filter_msg() - determine if we should accept arriving message
  433. */
  434. void tipc_group_filter_msg(struct tipc_group *grp, struct sk_buff_head *inputq,
  435. struct sk_buff_head *xmitq)
  436. {
  437. struct sk_buff *skb = __skb_dequeue(inputq);
  438. bool ack, deliver, update, leave = false;
  439. struct sk_buff_head *defq;
  440. struct tipc_member *m;
  441. struct tipc_msg *hdr;
  442. u32 node, port;
  443. int mtyp, blks;
  444. if (!skb)
  445. return;
  446. hdr = buf_msg(skb);
  447. node = msg_orignode(hdr);
  448. port = msg_origport(hdr);
  449. if (!msg_in_group(hdr))
  450. goto drop;
  451. m = tipc_group_find_member(grp, node, port);
  452. if (!tipc_group_is_sender(m))
  453. goto drop;
  454. if (less(msg_grp_bc_seqno(hdr), m->bc_rcv_nxt))
  455. goto drop;
  456. TIPC_SKB_CB(skb)->orig_member = m->instance;
  457. defq = &m->deferredq;
  458. tipc_group_sort_msg(skb, defq);
  459. while ((skb = skb_peek(defq))) {
  460. hdr = buf_msg(skb);
  461. mtyp = msg_type(hdr);
  462. blks = msg_blocks(hdr);
  463. deliver = true;
  464. ack = false;
  465. update = false;
  466. if (more(msg_grp_bc_seqno(hdr), m->bc_rcv_nxt))
  467. break;
  468. /* Decide what to do with message */
  469. switch (mtyp) {
  470. case TIPC_GRP_MCAST_MSG:
  471. if (msg_nameinst(hdr) != grp->instance) {
  472. update = true;
  473. deliver = false;
  474. }
  475. fallthrough;
  476. case TIPC_GRP_BCAST_MSG:
  477. m->bc_rcv_nxt++;
  478. ack = msg_grp_bc_ack_req(hdr);
  479. break;
  480. case TIPC_GRP_UCAST_MSG:
  481. break;
  482. case TIPC_GRP_MEMBER_EVT:
  483. if (m->state == MBR_LEAVING)
  484. leave = true;
  485. if (!grp->events)
  486. deliver = false;
  487. break;
  488. default:
  489. break;
  490. }
  491. /* Execute decisions */
  492. __skb_dequeue(defq);
  493. if (deliver)
  494. __skb_queue_tail(inputq, skb);
  495. else
  496. kfree_skb(skb);
  497. if (ack)
  498. tipc_group_proto_xmit(grp, m, GRP_ACK_MSG, xmitq);
  499. if (leave) {
  500. __skb_queue_purge(defq);
  501. tipc_group_delete_member(grp, m);
  502. break;
  503. }
  504. if (!update)
  505. continue;
  506. tipc_group_update_rcv_win(grp, blks, node, port, xmitq);
  507. }
  508. return;
  509. drop:
  510. kfree_skb(skb);
  511. }
  512. void tipc_group_update_rcv_win(struct tipc_group *grp, int blks, u32 node,
  513. u32 port, struct sk_buff_head *xmitq)
  514. {
  515. struct list_head *active = &grp->active;
  516. int max_active = grp->max_active;
  517. int reclaim_limit = max_active * 3 / 4;
  518. int active_cnt = grp->active_cnt;
  519. struct tipc_member *m, *rm, *pm;
  520. m = tipc_group_find_member(grp, node, port);
  521. if (!m)
  522. return;
  523. m->advertised -= blks;
  524. switch (m->state) {
  525. case MBR_JOINED:
  526. /* First, decide if member can go active */
  527. if (active_cnt <= max_active) {
  528. m->state = MBR_ACTIVE;
  529. list_add_tail(&m->list, active);
  530. grp->active_cnt++;
  531. tipc_group_proto_xmit(grp, m, GRP_ADV_MSG, xmitq);
  532. } else {
  533. m->state = MBR_PENDING;
  534. list_add_tail(&m->list, &grp->pending);
  535. }
  536. if (active_cnt < reclaim_limit)
  537. break;
  538. /* Reclaim from oldest active member, if possible */
  539. if (!list_empty(active)) {
  540. rm = list_first_entry(active, struct tipc_member, list);
  541. rm->state = MBR_RECLAIMING;
  542. list_del_init(&rm->list);
  543. tipc_group_proto_xmit(grp, rm, GRP_RECLAIM_MSG, xmitq);
  544. break;
  545. }
  546. /* Nobody to reclaim from; - revert oldest pending to JOINED */
  547. pm = list_first_entry(&grp->pending, struct tipc_member, list);
  548. list_del_init(&pm->list);
  549. pm->state = MBR_JOINED;
  550. tipc_group_proto_xmit(grp, pm, GRP_ADV_MSG, xmitq);
  551. break;
  552. case MBR_ACTIVE:
  553. if (!list_is_last(&m->list, &grp->active))
  554. list_move_tail(&m->list, &grp->active);
  555. if (m->advertised > (ADV_ACTIVE * 3 / 4))
  556. break;
  557. tipc_group_proto_xmit(grp, m, GRP_ADV_MSG, xmitq);
  558. break;
  559. case MBR_REMITTED:
  560. if (m->advertised > ADV_IDLE)
  561. break;
  562. m->state = MBR_JOINED;
  563. grp->active_cnt--;
  564. if (m->advertised < ADV_IDLE) {
  565. pr_warn_ratelimited("Rcv unexpected msg after REMIT\n");
  566. tipc_group_proto_xmit(grp, m, GRP_ADV_MSG, xmitq);
  567. }
  568. if (list_empty(&grp->pending))
  569. return;
  570. /* Set oldest pending member to active and advertise */
  571. pm = list_first_entry(&grp->pending, struct tipc_member, list);
  572. pm->state = MBR_ACTIVE;
  573. list_move_tail(&pm->list, &grp->active);
  574. grp->active_cnt++;
  575. tipc_group_proto_xmit(grp, pm, GRP_ADV_MSG, xmitq);
  576. break;
  577. case MBR_RECLAIMING:
  578. case MBR_JOINING:
  579. case MBR_LEAVING:
  580. default:
  581. break;
  582. }
  583. }
  584. static void tipc_group_create_event(struct tipc_group *grp,
  585. struct tipc_member *m,
  586. u32 event, u16 seqno,
  587. struct sk_buff_head *inputq)
  588. { u32 dnode = tipc_own_addr(grp->net);
  589. struct tipc_event evt;
  590. struct sk_buff *skb;
  591. struct tipc_msg *hdr;
  592. memset(&evt, 0, sizeof(evt));
  593. evt.event = event;
  594. evt.found_lower = m->instance;
  595. evt.found_upper = m->instance;
  596. evt.port.ref = m->port;
  597. evt.port.node = m->node;
  598. evt.s.seq.type = grp->type;
  599. evt.s.seq.lower = m->instance;
  600. evt.s.seq.upper = m->instance;
  601. skb = tipc_msg_create(TIPC_CRITICAL_IMPORTANCE, TIPC_GRP_MEMBER_EVT,
  602. GROUP_H_SIZE, sizeof(evt), dnode, m->node,
  603. grp->portid, m->port, 0);
  604. if (!skb)
  605. return;
  606. hdr = buf_msg(skb);
  607. msg_set_nametype(hdr, grp->type);
  608. msg_set_grp_evt(hdr, event);
  609. msg_set_dest_droppable(hdr, true);
  610. msg_set_grp_bc_seqno(hdr, seqno);
  611. memcpy(msg_data(hdr), &evt, sizeof(evt));
  612. TIPC_SKB_CB(skb)->orig_member = m->instance;
  613. __skb_queue_tail(inputq, skb);
  614. }
  615. static void tipc_group_proto_xmit(struct tipc_group *grp, struct tipc_member *m,
  616. int mtyp, struct sk_buff_head *xmitq)
  617. {
  618. struct tipc_msg *hdr;
  619. struct sk_buff *skb;
  620. int adv = 0;
  621. skb = tipc_msg_create(GROUP_PROTOCOL, mtyp, INT_H_SIZE, 0,
  622. m->node, tipc_own_addr(grp->net),
  623. m->port, grp->portid, 0);
  624. if (!skb)
  625. return;
  626. if (m->state == MBR_ACTIVE)
  627. adv = ADV_ACTIVE - m->advertised;
  628. else if (m->state == MBR_JOINED || m->state == MBR_PENDING)
  629. adv = ADV_IDLE - m->advertised;
  630. hdr = buf_msg(skb);
  631. if (mtyp == GRP_JOIN_MSG) {
  632. msg_set_grp_bc_syncpt(hdr, grp->bc_snd_nxt);
  633. msg_set_adv_win(hdr, adv);
  634. m->advertised += adv;
  635. } else if (mtyp == GRP_LEAVE_MSG) {
  636. msg_set_grp_bc_syncpt(hdr, grp->bc_snd_nxt);
  637. } else if (mtyp == GRP_ADV_MSG) {
  638. msg_set_adv_win(hdr, adv);
  639. m->advertised += adv;
  640. } else if (mtyp == GRP_ACK_MSG) {
  641. msg_set_grp_bc_acked(hdr, m->bc_rcv_nxt);
  642. } else if (mtyp == GRP_REMIT_MSG) {
  643. msg_set_grp_remitted(hdr, m->window);
  644. }
  645. msg_set_dest_droppable(hdr, true);
  646. __skb_queue_tail(xmitq, skb);
  647. }
  648. void tipc_group_proto_rcv(struct tipc_group *grp, bool *usr_wakeup,
  649. struct tipc_msg *hdr, struct sk_buff_head *inputq,
  650. struct sk_buff_head *xmitq)
  651. {
  652. u32 node = msg_orignode(hdr);
  653. u32 port = msg_origport(hdr);
  654. struct tipc_member *m, *pm;
  655. u16 remitted, in_flight;
  656. if (!grp)
  657. return;
  658. if (grp->scope == TIPC_NODE_SCOPE && node != tipc_own_addr(grp->net))
  659. return;
  660. m = tipc_group_find_member(grp, node, port);
  661. switch (msg_type(hdr)) {
  662. case GRP_JOIN_MSG:
  663. if (!m)
  664. m = tipc_group_create_member(grp, node, port,
  665. 0, MBR_JOINING);
  666. if (!m)
  667. return;
  668. m->bc_syncpt = msg_grp_bc_syncpt(hdr);
  669. m->bc_rcv_nxt = m->bc_syncpt;
  670. m->window += msg_adv_win(hdr);
  671. /* Wait until PUBLISH event is received if necessary */
  672. if (m->state != MBR_PUBLISHED)
  673. return;
  674. /* Member can be taken into service */
  675. m->state = MBR_JOINED;
  676. tipc_group_open(m, usr_wakeup);
  677. tipc_group_update_member(m, 0);
  678. tipc_group_proto_xmit(grp, m, GRP_ADV_MSG, xmitq);
  679. tipc_group_create_event(grp, m, TIPC_PUBLISHED,
  680. m->bc_syncpt, inputq);
  681. return;
  682. case GRP_LEAVE_MSG:
  683. if (!m)
  684. return;
  685. m->bc_syncpt = msg_grp_bc_syncpt(hdr);
  686. list_del_init(&m->list);
  687. tipc_group_open(m, usr_wakeup);
  688. tipc_group_decr_active(grp, m);
  689. m->state = MBR_LEAVING;
  690. tipc_group_create_event(grp, m, TIPC_WITHDRAWN,
  691. m->bc_syncpt, inputq);
  692. return;
  693. case GRP_ADV_MSG:
  694. if (!m)
  695. return;
  696. m->window += msg_adv_win(hdr);
  697. tipc_group_open(m, usr_wakeup);
  698. return;
  699. case GRP_ACK_MSG:
  700. if (!m)
  701. return;
  702. m->bc_acked = msg_grp_bc_acked(hdr);
  703. if (--grp->bc_ackers)
  704. return;
  705. list_del_init(&m->small_win);
  706. *m->group->open = true;
  707. *usr_wakeup = true;
  708. tipc_group_update_member(m, 0);
  709. return;
  710. case GRP_RECLAIM_MSG:
  711. if (!m)
  712. return;
  713. tipc_group_proto_xmit(grp, m, GRP_REMIT_MSG, xmitq);
  714. m->window = ADV_IDLE;
  715. tipc_group_open(m, usr_wakeup);
  716. return;
  717. case GRP_REMIT_MSG:
  718. if (!m || m->state != MBR_RECLAIMING)
  719. return;
  720. remitted = msg_grp_remitted(hdr);
  721. /* Messages preceding the REMIT still in receive queue */
  722. if (m->advertised > remitted) {
  723. m->state = MBR_REMITTED;
  724. in_flight = m->advertised - remitted;
  725. m->advertised = ADV_IDLE + in_flight;
  726. return;
  727. }
  728. /* This should never happen */
  729. if (m->advertised < remitted)
  730. pr_warn_ratelimited("Unexpected REMIT msg\n");
  731. /* All messages preceding the REMIT have been read */
  732. m->state = MBR_JOINED;
  733. grp->active_cnt--;
  734. m->advertised = ADV_IDLE;
  735. /* Set oldest pending member to active and advertise */
  736. if (list_empty(&grp->pending))
  737. return;
  738. pm = list_first_entry(&grp->pending, struct tipc_member, list);
  739. pm->state = MBR_ACTIVE;
  740. list_move_tail(&pm->list, &grp->active);
  741. grp->active_cnt++;
  742. if (pm->advertised <= (ADV_ACTIVE * 3 / 4))
  743. tipc_group_proto_xmit(grp, pm, GRP_ADV_MSG, xmitq);
  744. return;
  745. default:
  746. pr_warn("Received unknown GROUP_PROTO message\n");
  747. }
  748. }
  749. /* tipc_group_member_evt() - receive and handle a member up/down event
  750. */
  751. void tipc_group_member_evt(struct tipc_group *grp,
  752. bool *usr_wakeup,
  753. int *sk_rcvbuf,
  754. struct tipc_msg *hdr,
  755. struct sk_buff_head *inputq,
  756. struct sk_buff_head *xmitq)
  757. {
  758. struct tipc_event *evt = (void *)msg_data(hdr);
  759. u32 instance = evt->found_lower;
  760. u32 node = evt->port.node;
  761. u32 port = evt->port.ref;
  762. int event = evt->event;
  763. struct tipc_member *m;
  764. struct net *net;
  765. u32 self;
  766. if (!grp)
  767. return;
  768. net = grp->net;
  769. self = tipc_own_addr(net);
  770. if (!grp->loopback && node == self && port == grp->portid)
  771. return;
  772. m = tipc_group_find_member(grp, node, port);
  773. switch (event) {
  774. case TIPC_PUBLISHED:
  775. /* Send and wait for arrival of JOIN message if necessary */
  776. if (!m) {
  777. m = tipc_group_create_member(grp, node, port, instance,
  778. MBR_PUBLISHED);
  779. if (!m)
  780. break;
  781. tipc_group_update_member(m, 0);
  782. tipc_group_proto_xmit(grp, m, GRP_JOIN_MSG, xmitq);
  783. break;
  784. }
  785. if (m->state != MBR_JOINING)
  786. break;
  787. /* Member can be taken into service */
  788. m->instance = instance;
  789. m->state = MBR_JOINED;
  790. tipc_group_open(m, usr_wakeup);
  791. tipc_group_update_member(m, 0);
  792. tipc_group_proto_xmit(grp, m, GRP_JOIN_MSG, xmitq);
  793. tipc_group_create_event(grp, m, TIPC_PUBLISHED,
  794. m->bc_syncpt, inputq);
  795. break;
  796. case TIPC_WITHDRAWN:
  797. if (!m)
  798. break;
  799. tipc_group_decr_active(grp, m);
  800. m->state = MBR_LEAVING;
  801. list_del_init(&m->list);
  802. tipc_group_open(m, usr_wakeup);
  803. /* Only send event if no LEAVE message can be expected */
  804. if (!tipc_node_is_up(net, node))
  805. tipc_group_create_event(grp, m, TIPC_WITHDRAWN,
  806. m->bc_rcv_nxt, inputq);
  807. break;
  808. default:
  809. break;
  810. }
  811. *sk_rcvbuf = tipc_group_rcvbuf_limit(grp);
  812. }
  813. int tipc_group_fill_sock_diag(struct tipc_group *grp, struct sk_buff *skb)
  814. {
  815. struct nlattr *group = nla_nest_start_noflag(skb, TIPC_NLA_SOCK_GROUP);
  816. if (!group)
  817. return -EMSGSIZE;
  818. if (nla_put_u32(skb, TIPC_NLA_SOCK_GROUP_ID,
  819. grp->type) ||
  820. nla_put_u32(skb, TIPC_NLA_SOCK_GROUP_INSTANCE,
  821. grp->instance) ||
  822. nla_put_u32(skb, TIPC_NLA_SOCK_GROUP_BC_SEND_NEXT,
  823. grp->bc_snd_nxt))
  824. goto group_msg_cancel;
  825. if (grp->scope == TIPC_NODE_SCOPE)
  826. if (nla_put_flag(skb, TIPC_NLA_SOCK_GROUP_NODE_SCOPE))
  827. goto group_msg_cancel;
  828. if (grp->scope == TIPC_CLUSTER_SCOPE)
  829. if (nla_put_flag(skb, TIPC_NLA_SOCK_GROUP_CLUSTER_SCOPE))
  830. goto group_msg_cancel;
  831. if (*grp->open)
  832. if (nla_put_flag(skb, TIPC_NLA_SOCK_GROUP_OPEN))
  833. goto group_msg_cancel;
  834. nla_nest_end(skb, group);
  835. return 0;
  836. group_msg_cancel:
  837. nla_nest_cancel(skb, group);
  838. return -1;
  839. }