br_mdb.c 11 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493
  1. #include <linux/err.h>
  2. #include <linux/igmp.h>
  3. #include <linux/kernel.h>
  4. #include <linux/netdevice.h>
  5. #include <linux/rculist.h>
  6. #include <linux/skbuff.h>
  7. #include <linux/if_ether.h>
  8. #include <net/ip.h>
  9. #include <net/netlink.h>
  10. #if IS_ENABLED(CONFIG_IPV6)
  11. #include <net/ipv6.h>
  12. #endif
  13. #include "br_private.h"
  14. static int br_rports_fill_info(struct sk_buff *skb, struct netlink_callback *cb,
  15. struct net_device *dev)
  16. {
  17. struct net_bridge *br = netdev_priv(dev);
  18. struct net_bridge_port *p;
  19. struct hlist_node *n;
  20. struct nlattr *nest;
  21. if (!br->multicast_router || hlist_empty(&br->router_list))
  22. return 0;
  23. nest = nla_nest_start(skb, MDBA_ROUTER);
  24. if (nest == NULL)
  25. return -EMSGSIZE;
  26. hlist_for_each_entry_rcu(p, n, &br->router_list, rlist) {
  27. if (p && nla_put_u32(skb, MDBA_ROUTER_PORT, p->dev->ifindex))
  28. goto fail;
  29. }
  30. nla_nest_end(skb, nest);
  31. return 0;
  32. fail:
  33. nla_nest_cancel(skb, nest);
  34. return -EMSGSIZE;
  35. }
  36. static int br_mdb_fill_info(struct sk_buff *skb, struct netlink_callback *cb,
  37. struct net_device *dev)
  38. {
  39. struct net_bridge *br = netdev_priv(dev);
  40. struct net_bridge_mdb_htable *mdb;
  41. struct nlattr *nest, *nest2;
  42. int i, err = 0;
  43. int idx = 0, s_idx = cb->args[1];
  44. if (br->multicast_disabled)
  45. return 0;
  46. mdb = rcu_dereference(br->mdb);
  47. if (!mdb)
  48. return 0;
  49. nest = nla_nest_start(skb, MDBA_MDB);
  50. if (nest == NULL)
  51. return -EMSGSIZE;
  52. for (i = 0; i < mdb->max; i++) {
  53. struct hlist_node *h;
  54. struct net_bridge_mdb_entry *mp;
  55. struct net_bridge_port_group *p, **pp;
  56. struct net_bridge_port *port;
  57. hlist_for_each_entry_rcu(mp, h, &mdb->mhash[i], hlist[mdb->ver]) {
  58. if (idx < s_idx)
  59. goto skip;
  60. nest2 = nla_nest_start(skb, MDBA_MDB_ENTRY);
  61. if (nest2 == NULL) {
  62. err = -EMSGSIZE;
  63. goto out;
  64. }
  65. for (pp = &mp->ports;
  66. (p = rcu_dereference(*pp)) != NULL;
  67. pp = &p->next) {
  68. port = p->port;
  69. if (port) {
  70. struct br_mdb_entry e;
  71. e.ifindex = port->dev->ifindex;
  72. e.state = p->state;
  73. if (p->addr.proto == htons(ETH_P_IP))
  74. e.addr.u.ip4 = p->addr.u.ip4;
  75. #if IS_ENABLED(CONFIG_IPV6)
  76. if (p->addr.proto == htons(ETH_P_IPV6))
  77. e.addr.u.ip6 = p->addr.u.ip6;
  78. #endif
  79. e.addr.proto = p->addr.proto;
  80. if (nla_put(skb, MDBA_MDB_ENTRY_INFO, sizeof(e), &e)) {
  81. nla_nest_cancel(skb, nest2);
  82. err = -EMSGSIZE;
  83. goto out;
  84. }
  85. }
  86. }
  87. nla_nest_end(skb, nest2);
  88. skip:
  89. idx++;
  90. }
  91. }
  92. out:
  93. cb->args[1] = idx;
  94. nla_nest_end(skb, nest);
  95. return err;
  96. }
  97. static int br_mdb_dump(struct sk_buff *skb, struct netlink_callback *cb)
  98. {
  99. struct net_device *dev;
  100. struct net *net = sock_net(skb->sk);
  101. struct nlmsghdr *nlh = NULL;
  102. int idx = 0, s_idx;
  103. s_idx = cb->args[0];
  104. rcu_read_lock();
  105. /* In theory this could be wrapped to 0... */
  106. cb->seq = net->dev_base_seq + br_mdb_rehash_seq;
  107. for_each_netdev_rcu(net, dev) {
  108. if (dev->priv_flags & IFF_EBRIDGE) {
  109. struct br_port_msg *bpm;
  110. if (idx < s_idx)
  111. goto skip;
  112. nlh = nlmsg_put(skb, NETLINK_CB(cb->skb).portid,
  113. cb->nlh->nlmsg_seq, RTM_GETMDB,
  114. sizeof(*bpm), NLM_F_MULTI);
  115. if (nlh == NULL)
  116. break;
  117. bpm = nlmsg_data(nlh);
  118. bpm->ifindex = dev->ifindex;
  119. if (br_mdb_fill_info(skb, cb, dev) < 0)
  120. goto out;
  121. if (br_rports_fill_info(skb, cb, dev) < 0)
  122. goto out;
  123. cb->args[1] = 0;
  124. nlmsg_end(skb, nlh);
  125. skip:
  126. idx++;
  127. }
  128. }
  129. out:
  130. if (nlh)
  131. nlmsg_end(skb, nlh);
  132. rcu_read_unlock();
  133. cb->args[0] = idx;
  134. return skb->len;
  135. }
  136. static int nlmsg_populate_mdb_fill(struct sk_buff *skb,
  137. struct net_device *dev,
  138. struct br_mdb_entry *entry, u32 pid,
  139. u32 seq, int type, unsigned int flags)
  140. {
  141. struct nlmsghdr *nlh;
  142. struct br_port_msg *bpm;
  143. struct nlattr *nest, *nest2;
  144. nlh = nlmsg_put(skb, pid, seq, type, sizeof(*bpm), NLM_F_MULTI);
  145. if (!nlh)
  146. return -EMSGSIZE;
  147. bpm = nlmsg_data(nlh);
  148. bpm->family = AF_BRIDGE;
  149. bpm->ifindex = dev->ifindex;
  150. nest = nla_nest_start(skb, MDBA_MDB);
  151. if (nest == NULL)
  152. goto cancel;
  153. nest2 = nla_nest_start(skb, MDBA_MDB_ENTRY);
  154. if (nest2 == NULL)
  155. goto end;
  156. if (nla_put(skb, MDBA_MDB_ENTRY_INFO, sizeof(*entry), entry))
  157. goto end;
  158. nla_nest_end(skb, nest2);
  159. nla_nest_end(skb, nest);
  160. return nlmsg_end(skb, nlh);
  161. end:
  162. nla_nest_end(skb, nest);
  163. cancel:
  164. nlmsg_cancel(skb, nlh);
  165. return -EMSGSIZE;
  166. }
  167. static inline size_t rtnl_mdb_nlmsg_size(void)
  168. {
  169. return NLMSG_ALIGN(sizeof(struct br_port_msg))
  170. + nla_total_size(sizeof(struct br_mdb_entry));
  171. }
  172. static void __br_mdb_notify(struct net_device *dev, struct br_mdb_entry *entry,
  173. int type)
  174. {
  175. struct net *net = dev_net(dev);
  176. struct sk_buff *skb;
  177. int err = -ENOBUFS;
  178. skb = nlmsg_new(rtnl_mdb_nlmsg_size(), GFP_ATOMIC);
  179. if (!skb)
  180. goto errout;
  181. err = nlmsg_populate_mdb_fill(skb, dev, entry, 0, 0, type, NTF_SELF);
  182. if (err < 0) {
  183. kfree_skb(skb);
  184. goto errout;
  185. }
  186. rtnl_notify(skb, net, 0, RTNLGRP_MDB, NULL, GFP_ATOMIC);
  187. return;
  188. errout:
  189. rtnl_set_sk_err(net, RTNLGRP_MDB, err);
  190. }
  191. void br_mdb_notify(struct net_device *dev, struct net_bridge_port *port,
  192. struct br_ip *group, int type)
  193. {
  194. struct br_mdb_entry entry;
  195. entry.ifindex = port->dev->ifindex;
  196. entry.addr.proto = group->proto;
  197. entry.addr.u.ip4 = group->u.ip4;
  198. #if IS_ENABLED(CONFIG_IPV6)
  199. entry.addr.u.ip6 = group->u.ip6;
  200. #endif
  201. __br_mdb_notify(dev, &entry, type);
  202. }
  203. static bool is_valid_mdb_entry(struct br_mdb_entry *entry)
  204. {
  205. if (entry->ifindex == 0)
  206. return false;
  207. if (entry->addr.proto == htons(ETH_P_IP)) {
  208. if (!ipv4_is_multicast(entry->addr.u.ip4))
  209. return false;
  210. if (ipv4_is_local_multicast(entry->addr.u.ip4))
  211. return false;
  212. #if IS_ENABLED(CONFIG_IPV6)
  213. } else if (entry->addr.proto == htons(ETH_P_IPV6)) {
  214. if (!ipv6_is_transient_multicast(&entry->addr.u.ip6))
  215. return false;
  216. #endif
  217. } else
  218. return false;
  219. if (entry->state != MDB_PERMANENT && entry->state != MDB_TEMPORARY)
  220. return false;
  221. return true;
  222. }
  223. static int br_mdb_parse(struct sk_buff *skb, struct nlmsghdr *nlh,
  224. struct net_device **pdev, struct br_mdb_entry **pentry)
  225. {
  226. struct net *net = sock_net(skb->sk);
  227. struct br_mdb_entry *entry;
  228. struct br_port_msg *bpm;
  229. struct nlattr *tb[MDBA_SET_ENTRY_MAX+1];
  230. struct net_device *dev;
  231. int err;
  232. if (!capable(CAP_NET_ADMIN))
  233. return -EPERM;
  234. err = nlmsg_parse(nlh, sizeof(*bpm), tb, MDBA_SET_ENTRY, NULL);
  235. if (err < 0)
  236. return err;
  237. bpm = nlmsg_data(nlh);
  238. if (bpm->ifindex == 0) {
  239. pr_info("PF_BRIDGE: br_mdb_parse() with invalid ifindex\n");
  240. return -EINVAL;
  241. }
  242. dev = __dev_get_by_index(net, bpm->ifindex);
  243. if (dev == NULL) {
  244. pr_info("PF_BRIDGE: br_mdb_parse() with unknown ifindex\n");
  245. return -ENODEV;
  246. }
  247. if (!(dev->priv_flags & IFF_EBRIDGE)) {
  248. pr_info("PF_BRIDGE: br_mdb_parse() with non-bridge\n");
  249. return -EOPNOTSUPP;
  250. }
  251. *pdev = dev;
  252. if (!tb[MDBA_SET_ENTRY] ||
  253. nla_len(tb[MDBA_SET_ENTRY]) != sizeof(struct br_mdb_entry)) {
  254. pr_info("PF_BRIDGE: br_mdb_parse() with invalid attr\n");
  255. return -EINVAL;
  256. }
  257. entry = nla_data(tb[MDBA_SET_ENTRY]);
  258. if (!is_valid_mdb_entry(entry)) {
  259. pr_info("PF_BRIDGE: br_mdb_parse() with invalid entry\n");
  260. return -EINVAL;
  261. }
  262. *pentry = entry;
  263. return 0;
  264. }
  265. static int br_mdb_add_group(struct net_bridge *br, struct net_bridge_port *port,
  266. struct br_ip *group, unsigned char state)
  267. {
  268. struct net_bridge_mdb_entry *mp;
  269. struct net_bridge_port_group *p;
  270. struct net_bridge_port_group __rcu **pp;
  271. struct net_bridge_mdb_htable *mdb;
  272. int err;
  273. mdb = mlock_dereference(br->mdb, br);
  274. mp = br_mdb_ip_get(mdb, group);
  275. if (!mp) {
  276. mp = br_multicast_new_group(br, port, group);
  277. err = PTR_ERR(mp);
  278. if (IS_ERR(mp))
  279. return err;
  280. }
  281. for (pp = &mp->ports;
  282. (p = mlock_dereference(*pp, br)) != NULL;
  283. pp = &p->next) {
  284. if (p->port == port)
  285. return -EEXIST;
  286. if ((unsigned long)p->port < (unsigned long)port)
  287. break;
  288. }
  289. p = br_multicast_new_port_group(port, group, *pp, state);
  290. if (unlikely(!p))
  291. return -ENOMEM;
  292. rcu_assign_pointer(*pp, p);
  293. br_mdb_notify(br->dev, port, group, RTM_NEWMDB);
  294. return 0;
  295. }
  296. static int __br_mdb_add(struct net *net, struct net_bridge *br,
  297. struct br_mdb_entry *entry)
  298. {
  299. struct br_ip ip;
  300. struct net_device *dev;
  301. struct net_bridge_port *p;
  302. int ret;
  303. if (!netif_running(br->dev) || br->multicast_disabled)
  304. return -EINVAL;
  305. dev = __dev_get_by_index(net, entry->ifindex);
  306. if (!dev)
  307. return -ENODEV;
  308. p = br_port_get_rtnl(dev);
  309. if (!p || p->br != br || p->state == BR_STATE_DISABLED)
  310. return -EINVAL;
  311. ip.proto = entry->addr.proto;
  312. if (ip.proto == htons(ETH_P_IP))
  313. ip.u.ip4 = entry->addr.u.ip4;
  314. #if IS_ENABLED(CONFIG_IPV6)
  315. else
  316. ip.u.ip6 = entry->addr.u.ip6;
  317. #endif
  318. spin_lock_bh(&br->multicast_lock);
  319. ret = br_mdb_add_group(br, p, &ip, entry->state);
  320. spin_unlock_bh(&br->multicast_lock);
  321. return ret;
  322. }
  323. static int br_mdb_add(struct sk_buff *skb, struct nlmsghdr *nlh, void *arg)
  324. {
  325. struct net *net = sock_net(skb->sk);
  326. struct br_mdb_entry *entry;
  327. struct net_device *dev;
  328. struct net_bridge *br;
  329. int err;
  330. err = br_mdb_parse(skb, nlh, &dev, &entry);
  331. if (err < 0)
  332. return err;
  333. br = netdev_priv(dev);
  334. err = __br_mdb_add(net, br, entry);
  335. if (!err)
  336. __br_mdb_notify(dev, entry, RTM_NEWMDB);
  337. return err;
  338. }
  339. static int __br_mdb_del(struct net_bridge *br, struct br_mdb_entry *entry)
  340. {
  341. struct net_bridge_mdb_htable *mdb;
  342. struct net_bridge_mdb_entry *mp;
  343. struct net_bridge_port_group *p;
  344. struct net_bridge_port_group __rcu **pp;
  345. struct br_ip ip;
  346. int err = -EINVAL;
  347. if (!netif_running(br->dev) || br->multicast_disabled)
  348. return -EINVAL;
  349. if (timer_pending(&br->multicast_querier_timer))
  350. return -EBUSY;
  351. ip.proto = entry->addr.proto;
  352. if (ip.proto == htons(ETH_P_IP))
  353. ip.u.ip4 = entry->addr.u.ip4;
  354. #if IS_ENABLED(CONFIG_IPV6)
  355. else
  356. ip.u.ip6 = entry->addr.u.ip6;
  357. #endif
  358. spin_lock_bh(&br->multicast_lock);
  359. mdb = mlock_dereference(br->mdb, br);
  360. mp = br_mdb_ip_get(mdb, &ip);
  361. if (!mp)
  362. goto unlock;
  363. for (pp = &mp->ports;
  364. (p = mlock_dereference(*pp, br)) != NULL;
  365. pp = &p->next) {
  366. if (!p->port || p->port->dev->ifindex != entry->ifindex)
  367. continue;
  368. if (p->port->state == BR_STATE_DISABLED)
  369. goto unlock;
  370. rcu_assign_pointer(*pp, p->next);
  371. hlist_del_init(&p->mglist);
  372. del_timer(&p->timer);
  373. call_rcu_bh(&p->rcu, br_multicast_free_pg);
  374. err = 0;
  375. if (!mp->ports && !mp->mglist &&
  376. netif_running(br->dev))
  377. mod_timer(&mp->timer, jiffies);
  378. break;
  379. }
  380. unlock:
  381. spin_unlock_bh(&br->multicast_lock);
  382. return err;
  383. }
  384. static int br_mdb_del(struct sk_buff *skb, struct nlmsghdr *nlh, void *arg)
  385. {
  386. struct net_device *dev;
  387. struct br_mdb_entry *entry;
  388. struct net_bridge *br;
  389. int err;
  390. err = br_mdb_parse(skb, nlh, &dev, &entry);
  391. if (err < 0)
  392. return err;
  393. br = netdev_priv(dev);
  394. err = __br_mdb_del(br, entry);
  395. if (!err)
  396. __br_mdb_notify(dev, entry, RTM_DELMDB);
  397. return err;
  398. }
  399. void br_mdb_init(void)
  400. {
  401. rtnl_register(PF_BRIDGE, RTM_GETMDB, NULL, br_mdb_dump, NULL);
  402. rtnl_register(PF_BRIDGE, RTM_NEWMDB, br_mdb_add, NULL, NULL);
  403. rtnl_register(PF_BRIDGE, RTM_DELMDB, br_mdb_del, NULL, NULL);
  404. }
  405. void br_mdb_uninit(void)
  406. {
  407. rtnl_unregister(PF_BRIDGE, RTM_GETMDB);
  408. rtnl_unregister(PF_BRIDGE, RTM_NEWMDB);
  409. rtnl_unregister(PF_BRIDGE, RTM_DELMDB);
  410. }