br_if.c 9.5 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480
  1. /*
  2. * Userspace interface
  3. * Linux ethernet bridge
  4. *
  5. * Authors:
  6. * Lennert Buytenhek <buytenh@gnu.org>
  7. *
  8. * This program is free software; you can redistribute it and/or
  9. * modify it under the terms of the GNU General Public License
  10. * as published by the Free Software Foundation; either version
  11. * 2 of the License, or (at your option) any later version.
  12. */
  13. #include <linux/kernel.h>
  14. #include <linux/netdevice.h>
  15. #include <linux/ethtool.h>
  16. #include <linux/if_arp.h>
  17. #include <linux/module.h>
  18. #include <linux/init.h>
  19. #include <linux/rtnetlink.h>
  20. #include <linux/if_ether.h>
  21. #include <net/sock.h>
  22. #include "br_private.h"
  23. /*
  24. * Determine initial path cost based on speed.
  25. * using recommendations from 802.1d standard
  26. *
  27. * Since driver might sleep need to not be holding any locks.
  28. */
  29. static int port_cost(struct net_device *dev)
  30. {
  31. if (dev->ethtool_ops && dev->ethtool_ops->get_settings) {
  32. struct ethtool_cmd ecmd = { .cmd = ETHTOOL_GSET, };
  33. if (!dev->ethtool_ops->get_settings(dev, &ecmd)) {
  34. switch(ecmd.speed) {
  35. case SPEED_10000:
  36. return 2;
  37. case SPEED_1000:
  38. return 4;
  39. case SPEED_100:
  40. return 19;
  41. case SPEED_10:
  42. return 100;
  43. }
  44. }
  45. }
  46. /* Old silly heuristics based on name */
  47. if (!strncmp(dev->name, "lec", 3))
  48. return 7;
  49. if (!strncmp(dev->name, "plip", 4))
  50. return 2500;
  51. return 100; /* assume old 10Mbps */
  52. }
  53. /*
  54. * Check for port carrier transistions.
  55. * Called from work queue to allow for calling functions that
  56. * might sleep (such as speed check), and to debounce.
  57. */
  58. void br_port_carrier_check(struct net_bridge_port *p)
  59. {
  60. struct net_device *dev = p->dev;
  61. struct net_bridge *br = p->br;
  62. if (netif_carrier_ok(dev))
  63. p->path_cost = port_cost(dev);
  64. if (netif_running(br->dev)) {
  65. spin_lock_bh(&br->lock);
  66. if (netif_carrier_ok(dev)) {
  67. if (p->state == BR_STATE_DISABLED)
  68. br_stp_enable_port(p);
  69. } else {
  70. if (p->state != BR_STATE_DISABLED)
  71. br_stp_disable_port(p);
  72. }
  73. spin_unlock_bh(&br->lock);
  74. }
  75. }
  76. static void release_nbp(struct kobject *kobj)
  77. {
  78. struct net_bridge_port *p
  79. = container_of(kobj, struct net_bridge_port, kobj);
  80. kfree(p);
  81. }
  82. static struct kobj_type brport_ktype = {
  83. #ifdef CONFIG_SYSFS
  84. .sysfs_ops = &brport_sysfs_ops,
  85. #endif
  86. .release = release_nbp,
  87. };
  88. static void destroy_nbp(struct net_bridge_port *p)
  89. {
  90. struct net_device *dev = p->dev;
  91. p->br = NULL;
  92. p->dev = NULL;
  93. dev_put(dev);
  94. kobject_put(&p->kobj);
  95. }
  96. static void destroy_nbp_rcu(struct rcu_head *head)
  97. {
  98. struct net_bridge_port *p =
  99. container_of(head, struct net_bridge_port, rcu);
  100. destroy_nbp(p);
  101. }
  102. /* Delete port(interface) from bridge is done in two steps.
  103. * via RCU. First step, marks device as down. That deletes
  104. * all the timers and stops new packets from flowing through.
  105. *
  106. * Final cleanup doesn't occur until after all CPU's finished
  107. * processing packets.
  108. *
  109. * Protected from multiple admin operations by RTNL mutex
  110. */
  111. static void del_nbp(struct net_bridge_port *p)
  112. {
  113. struct net_bridge *br = p->br;
  114. struct net_device *dev = p->dev;
  115. sysfs_remove_link(br->ifobj, dev->name);
  116. dev_set_promiscuity(dev, -1);
  117. spin_lock_bh(&br->lock);
  118. br_stp_disable_port(p);
  119. spin_unlock_bh(&br->lock);
  120. br_ifinfo_notify(RTM_DELLINK, p);
  121. br_fdb_delete_by_port(br, p, 1);
  122. list_del_rcu(&p->list);
  123. rcu_assign_pointer(dev->br_port, NULL);
  124. kobject_uevent(&p->kobj, KOBJ_REMOVE);
  125. kobject_del(&p->kobj);
  126. call_rcu(&p->rcu, destroy_nbp_rcu);
  127. }
  128. /* called with RTNL */
  129. static void del_br(struct net_bridge *br)
  130. {
  131. struct net_bridge_port *p, *n;
  132. list_for_each_entry_safe(p, n, &br->port_list, list) {
  133. del_nbp(p);
  134. }
  135. del_timer_sync(&br->gc_timer);
  136. br_sysfs_delbr(br->dev);
  137. unregister_netdevice(br->dev);
  138. }
  139. static struct net_device *new_bridge_dev(struct net *net, const char *name)
  140. {
  141. struct net_bridge *br;
  142. struct net_device *dev;
  143. dev = alloc_netdev(sizeof(struct net_bridge), name,
  144. br_dev_setup);
  145. if (!dev)
  146. return NULL;
  147. dev_net_set(dev, net);
  148. br = netdev_priv(dev);
  149. br->dev = dev;
  150. spin_lock_init(&br->lock);
  151. INIT_LIST_HEAD(&br->port_list);
  152. spin_lock_init(&br->hash_lock);
  153. br->bridge_id.prio[0] = 0x80;
  154. br->bridge_id.prio[1] = 0x00;
  155. memcpy(br->group_addr, br_group_address, ETH_ALEN);
  156. br->feature_mask = dev->features;
  157. br->stp_enabled = BR_NO_STP;
  158. br->designated_root = br->bridge_id;
  159. br->root_path_cost = 0;
  160. br->root_port = 0;
  161. br->bridge_max_age = br->max_age = 20 * HZ;
  162. br->bridge_hello_time = br->hello_time = 2 * HZ;
  163. br->bridge_forward_delay = br->forward_delay = 15 * HZ;
  164. br->topology_change = 0;
  165. br->topology_change_detected = 0;
  166. br->ageing_time = 300 * HZ;
  167. br_netfilter_rtable_init(br);
  168. INIT_LIST_HEAD(&br->age_list);
  169. br_stp_timer_init(br);
  170. return dev;
  171. }
  172. /* find an available port number */
  173. static int find_portno(struct net_bridge *br)
  174. {
  175. int index;
  176. struct net_bridge_port *p;
  177. unsigned long *inuse;
  178. inuse = kcalloc(BITS_TO_LONGS(BR_MAX_PORTS), sizeof(unsigned long),
  179. GFP_KERNEL);
  180. if (!inuse)
  181. return -ENOMEM;
  182. set_bit(0, inuse); /* zero is reserved */
  183. list_for_each_entry(p, &br->port_list, list) {
  184. set_bit(p->port_no, inuse);
  185. }
  186. index = find_first_zero_bit(inuse, BR_MAX_PORTS);
  187. kfree(inuse);
  188. return (index >= BR_MAX_PORTS) ? -EXFULL : index;
  189. }
  190. /* called with RTNL but without bridge lock */
  191. static struct net_bridge_port *new_nbp(struct net_bridge *br,
  192. struct net_device *dev)
  193. {
  194. int index;
  195. struct net_bridge_port *p;
  196. index = find_portno(br);
  197. if (index < 0)
  198. return ERR_PTR(index);
  199. p = kzalloc(sizeof(*p), GFP_KERNEL);
  200. if (p == NULL)
  201. return ERR_PTR(-ENOMEM);
  202. p->br = br;
  203. dev_hold(dev);
  204. p->dev = dev;
  205. p->path_cost = port_cost(dev);
  206. p->priority = 0x8000 >> BR_PORT_BITS;
  207. p->port_no = index;
  208. p->flags = 0;
  209. br_init_port(p);
  210. p->state = BR_STATE_DISABLED;
  211. br_stp_port_timer_init(p);
  212. return p;
  213. }
  214. static struct device_type br_type = {
  215. .name = "bridge",
  216. };
  217. int br_add_bridge(struct net *net, const char *name)
  218. {
  219. struct net_device *dev;
  220. int ret;
  221. dev = new_bridge_dev(net, name);
  222. if (!dev)
  223. return -ENOMEM;
  224. rtnl_lock();
  225. if (strchr(dev->name, '%')) {
  226. ret = dev_alloc_name(dev, dev->name);
  227. if (ret < 0)
  228. goto out_free;
  229. }
  230. SET_NETDEV_DEVTYPE(dev, &br_type);
  231. ret = register_netdevice(dev);
  232. if (ret)
  233. goto out_free;
  234. ret = br_sysfs_addbr(dev);
  235. if (ret)
  236. unregister_netdevice(dev);
  237. out:
  238. rtnl_unlock();
  239. return ret;
  240. out_free:
  241. free_netdev(dev);
  242. goto out;
  243. }
  244. int br_del_bridge(struct net *net, const char *name)
  245. {
  246. struct net_device *dev;
  247. int ret = 0;
  248. rtnl_lock();
  249. dev = __dev_get_by_name(net, name);
  250. if (dev == NULL)
  251. ret = -ENXIO; /* Could not find device */
  252. else if (!(dev->priv_flags & IFF_EBRIDGE)) {
  253. /* Attempt to delete non bridge device! */
  254. ret = -EPERM;
  255. }
  256. else if (dev->flags & IFF_UP) {
  257. /* Not shutdown yet. */
  258. ret = -EBUSY;
  259. }
  260. else
  261. del_br(netdev_priv(dev));
  262. rtnl_unlock();
  263. return ret;
  264. }
  265. /* MTU of the bridge pseudo-device: ETH_DATA_LEN or the minimum of the ports */
  266. int br_min_mtu(const struct net_bridge *br)
  267. {
  268. const struct net_bridge_port *p;
  269. int mtu = 0;
  270. ASSERT_RTNL();
  271. if (list_empty(&br->port_list))
  272. mtu = ETH_DATA_LEN;
  273. else {
  274. list_for_each_entry(p, &br->port_list, list) {
  275. if (!mtu || p->dev->mtu < mtu)
  276. mtu = p->dev->mtu;
  277. }
  278. }
  279. return mtu;
  280. }
  281. /*
  282. * Recomputes features using slave's features
  283. */
  284. void br_features_recompute(struct net_bridge *br)
  285. {
  286. struct net_bridge_port *p;
  287. unsigned long features, mask;
  288. features = mask = br->feature_mask;
  289. if (list_empty(&br->port_list))
  290. goto done;
  291. features &= ~NETIF_F_ONE_FOR_ALL;
  292. list_for_each_entry(p, &br->port_list, list) {
  293. features = netdev_increment_features(features,
  294. p->dev->features, mask);
  295. }
  296. done:
  297. br->dev->features = netdev_fix_features(features, NULL);
  298. }
  299. /* called with RTNL */
  300. int br_add_if(struct net_bridge *br, struct net_device *dev)
  301. {
  302. struct net_bridge_port *p;
  303. int err = 0;
  304. /* Don't allow bridging non-ethernet like devices */
  305. if ((dev->flags & IFF_LOOPBACK) ||
  306. dev->type != ARPHRD_ETHER || dev->addr_len != ETH_ALEN)
  307. return -EINVAL;
  308. /* No bridging of bridges */
  309. if (dev->netdev_ops->ndo_start_xmit == br_dev_xmit)
  310. return -ELOOP;
  311. /* Device is already being bridged */
  312. if (dev->br_port != NULL)
  313. return -EBUSY;
  314. p = new_nbp(br, dev);
  315. if (IS_ERR(p))
  316. return PTR_ERR(p);
  317. err = dev_set_promiscuity(dev, 1);
  318. if (err)
  319. goto put_back;
  320. err = kobject_init_and_add(&p->kobj, &brport_ktype, &(dev->dev.kobj),
  321. SYSFS_BRIDGE_PORT_ATTR);
  322. if (err)
  323. goto err0;
  324. err = br_fdb_insert(br, p, dev->dev_addr);
  325. if (err)
  326. goto err1;
  327. err = br_sysfs_addif(p);
  328. if (err)
  329. goto err2;
  330. rcu_assign_pointer(dev->br_port, p);
  331. dev_disable_lro(dev);
  332. list_add_rcu(&p->list, &br->port_list);
  333. spin_lock_bh(&br->lock);
  334. br_stp_recalculate_bridge_id(br);
  335. br_features_recompute(br);
  336. if ((dev->flags & IFF_UP) && netif_carrier_ok(dev) &&
  337. (br->dev->flags & IFF_UP))
  338. br_stp_enable_port(p);
  339. spin_unlock_bh(&br->lock);
  340. br_ifinfo_notify(RTM_NEWLINK, p);
  341. dev_set_mtu(br->dev, br_min_mtu(br));
  342. kobject_uevent(&p->kobj, KOBJ_ADD);
  343. return 0;
  344. err2:
  345. br_fdb_delete_by_port(br, p, 1);
  346. err1:
  347. kobject_put(&p->kobj);
  348. p = NULL; /* kobject_put frees */
  349. err0:
  350. dev_set_promiscuity(dev, -1);
  351. put_back:
  352. dev_put(dev);
  353. kfree(p);
  354. return err;
  355. }
  356. /* called with RTNL */
  357. int br_del_if(struct net_bridge *br, struct net_device *dev)
  358. {
  359. struct net_bridge_port *p = dev->br_port;
  360. if (!p || p->br != br)
  361. return -EINVAL;
  362. del_nbp(p);
  363. spin_lock_bh(&br->lock);
  364. br_stp_recalculate_bridge_id(br);
  365. br_features_recompute(br);
  366. spin_unlock_bh(&br->lock);
  367. return 0;
  368. }
  369. void br_net_exit(struct net *net)
  370. {
  371. struct net_device *dev;
  372. rtnl_lock();
  373. restart:
  374. for_each_netdev(net, dev) {
  375. if (dev->priv_flags & IFF_EBRIDGE) {
  376. del_br(netdev_priv(dev));
  377. goto restart;
  378. }
  379. }
  380. rtnl_unlock();
  381. }