rtnetlink.c 38 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634635636637638639640641642643644645646647648649650651652653654655656657658659660661662663664665666667668669670671672673674675676677678679680681682683684685686687688689690691692693694695696697698699700701702703704705706707708709710711712713714715716717718719720721722723724725726727728729730731732733734735736737738739740741742743744745746747748749750751752753754755756757758759760761762763764765766767768769770771772773774775776777778779780781782783784785786787788789790791792793794795796797798799800801802803804805806807808809810811812813814815816817818819820821822823824825826827828829830831832833834835836837838839840841842843844845846847848849850851852853854855856857858859860861862863864865866867868869870871872873874875876877878879880881882883884885886887888889890891892893894895896897898899900901902903904905906907908909910911912913914915916917918919920921922923924925926927928929930931932933934935936937938939940941942943944945946947948949950951952953954955956957958959960961962963964965966967968969970971972973974975976977978979980981982983984985986987988989990991992993994995996997998999100010011002100310041005100610071008100910101011101210131014101510161017101810191020102110221023102410251026102710281029103010311032103310341035103610371038103910401041104210431044104510461047104810491050105110521053105410551056105710581059106010611062106310641065106610671068106910701071107210731074107510761077107810791080108110821083108410851086108710881089109010911092109310941095109610971098109911001101110211031104110511061107110811091110111111121113111411151116111711181119112011211122112311241125112611271128112911301131113211331134113511361137113811391140114111421143114411451146114711481149115011511152115311541155115611571158115911601161116211631164116511661167116811691170117111721173117411751176117711781179118011811182118311841185118611871188118911901191119211931194119511961197119811991200120112021203120412051206120712081209121012111212121312141215121612171218121912201221122212231224122512261227122812291230123112321233123412351236123712381239124012411242124312441245124612471248124912501251125212531254125512561257125812591260126112621263126412651266126712681269127012711272127312741275127612771278127912801281128212831284128512861287128812891290129112921293129412951296129712981299130013011302130313041305130613071308130913101311131213131314131513161317131813191320132113221323132413251326132713281329133013311332133313341335133613371338133913401341134213431344134513461347134813491350135113521353135413551356135713581359136013611362136313641365136613671368136913701371137213731374137513761377137813791380138113821383138413851386138713881389139013911392139313941395139613971398139914001401140214031404140514061407140814091410141114121413141414151416141714181419142014211422142314241425142614271428142914301431143214331434143514361437143814391440144114421443144414451446144714481449145014511452145314541455145614571458145914601461146214631464146514661467146814691470147114721473147414751476147714781479148014811482148314841485148614871488148914901491149214931494149514961497149814991500150115021503150415051506150715081509151015111512151315141515151615171518151915201521152215231524152515261527152815291530153115321533153415351536153715381539154015411542154315441545154615471548154915501551155215531554155515561557155815591560156115621563156415651566156715681569157015711572157315741575157615771578157915801581158215831584158515861587158815891590159115921593159415951596159715981599160016011602
  1. /*
  2. * INET An implementation of the TCP/IP protocol suite for the LINUX
  3. * operating system. INET is implemented using the BSD Socket
  4. * interface as the means of communication with the user level.
  5. *
  6. * Routing netlink socket interface: protocol independent part.
  7. *
  8. * Authors: Alexey Kuznetsov, <kuznet@ms2.inr.ac.ru>
  9. *
  10. * This program is free software; you can redistribute it and/or
  11. * modify it under the terms of the GNU General Public License
  12. * as published by the Free Software Foundation; either version
  13. * 2 of the License, or (at your option) any later version.
  14. *
  15. * Fixes:
  16. * Vitaly E. Lavrov RTA_OK arithmetics was wrong.
  17. */
  18. #include <linux/errno.h>
  19. #include <linux/module.h>
  20. #include <linux/types.h>
  21. #include <linux/socket.h>
  22. #include <linux/kernel.h>
  23. #include <linux/timer.h>
  24. #include <linux/string.h>
  25. #include <linux/sockios.h>
  26. #include <linux/net.h>
  27. #include <linux/fcntl.h>
  28. #include <linux/mm.h>
  29. #include <linux/slab.h>
  30. #include <linux/interrupt.h>
  31. #include <linux/capability.h>
  32. #include <linux/skbuff.h>
  33. #include <linux/init.h>
  34. #include <linux/security.h>
  35. #include <linux/mutex.h>
  36. #include <linux/if_addr.h>
  37. #include <linux/pci.h>
  38. #include <asm/uaccess.h>
  39. #include <asm/system.h>
  40. #include <linux/inet.h>
  41. #include <linux/netdevice.h>
  42. #include <net/ip.h>
  43. #include <net/protocol.h>
  44. #include <net/arp.h>
  45. #include <net/route.h>
  46. #include <net/udp.h>
  47. #include <net/sock.h>
  48. #include <net/pkt_sched.h>
  49. #include <net/fib_rules.h>
  50. #include <net/rtnetlink.h>
  51. #include <net/net_namespace.h>
  52. struct rtnl_link {
  53. rtnl_doit_func doit;
  54. rtnl_dumpit_func dumpit;
  55. };
  56. static DEFINE_MUTEX(rtnl_mutex);
  57. void rtnl_lock(void)
  58. {
  59. mutex_lock(&rtnl_mutex);
  60. }
  61. EXPORT_SYMBOL(rtnl_lock);
  62. void __rtnl_unlock(void)
  63. {
  64. mutex_unlock(&rtnl_mutex);
  65. }
  66. void rtnl_unlock(void)
  67. {
  68. /* This fellow will unlock it for us. */
  69. netdev_run_todo();
  70. }
  71. EXPORT_SYMBOL(rtnl_unlock);
  72. int rtnl_trylock(void)
  73. {
  74. return mutex_trylock(&rtnl_mutex);
  75. }
  76. EXPORT_SYMBOL(rtnl_trylock);
  77. int rtnl_is_locked(void)
  78. {
  79. return mutex_is_locked(&rtnl_mutex);
  80. }
  81. EXPORT_SYMBOL(rtnl_is_locked);
  82. #ifdef CONFIG_PROVE_LOCKING
  83. int lockdep_rtnl_is_held(void)
  84. {
  85. return lockdep_is_held(&rtnl_mutex);
  86. }
  87. EXPORT_SYMBOL(lockdep_rtnl_is_held);
  88. #endif /* #ifdef CONFIG_PROVE_LOCKING */
  89. static struct rtnl_link *rtnl_msg_handlers[NPROTO];
  90. static inline int rtm_msgindex(int msgtype)
  91. {
  92. int msgindex = msgtype - RTM_BASE;
  93. /*
  94. * msgindex < 0 implies someone tried to register a netlink
  95. * control code. msgindex >= RTM_NR_MSGTYPES may indicate that
  96. * the message type has not been added to linux/rtnetlink.h
  97. */
  98. BUG_ON(msgindex < 0 || msgindex >= RTM_NR_MSGTYPES);
  99. return msgindex;
  100. }
  101. static rtnl_doit_func rtnl_get_doit(int protocol, int msgindex)
  102. {
  103. struct rtnl_link *tab;
  104. tab = rtnl_msg_handlers[protocol];
  105. if (tab == NULL || tab[msgindex].doit == NULL)
  106. tab = rtnl_msg_handlers[PF_UNSPEC];
  107. return tab ? tab[msgindex].doit : NULL;
  108. }
  109. static rtnl_dumpit_func rtnl_get_dumpit(int protocol, int msgindex)
  110. {
  111. struct rtnl_link *tab;
  112. tab = rtnl_msg_handlers[protocol];
  113. if (tab == NULL || tab[msgindex].dumpit == NULL)
  114. tab = rtnl_msg_handlers[PF_UNSPEC];
  115. return tab ? tab[msgindex].dumpit : NULL;
  116. }
  117. /**
  118. * __rtnl_register - Register a rtnetlink message type
  119. * @protocol: Protocol family or PF_UNSPEC
  120. * @msgtype: rtnetlink message type
  121. * @doit: Function pointer called for each request message
  122. * @dumpit: Function pointer called for each dump request (NLM_F_DUMP) message
  123. *
  124. * Registers the specified function pointers (at least one of them has
  125. * to be non-NULL) to be called whenever a request message for the
  126. * specified protocol family and message type is received.
  127. *
  128. * The special protocol family PF_UNSPEC may be used to define fallback
  129. * function pointers for the case when no entry for the specific protocol
  130. * family exists.
  131. *
  132. * Returns 0 on success or a negative error code.
  133. */
  134. int __rtnl_register(int protocol, int msgtype,
  135. rtnl_doit_func doit, rtnl_dumpit_func dumpit)
  136. {
  137. struct rtnl_link *tab;
  138. int msgindex;
  139. BUG_ON(protocol < 0 || protocol >= NPROTO);
  140. msgindex = rtm_msgindex(msgtype);
  141. tab = rtnl_msg_handlers[protocol];
  142. if (tab == NULL) {
  143. tab = kcalloc(RTM_NR_MSGTYPES, sizeof(*tab), GFP_KERNEL);
  144. if (tab == NULL)
  145. return -ENOBUFS;
  146. rtnl_msg_handlers[protocol] = tab;
  147. }
  148. if (doit)
  149. tab[msgindex].doit = doit;
  150. if (dumpit)
  151. tab[msgindex].dumpit = dumpit;
  152. return 0;
  153. }
  154. EXPORT_SYMBOL_GPL(__rtnl_register);
  155. /**
  156. * rtnl_register - Register a rtnetlink message type
  157. *
  158. * Identical to __rtnl_register() but panics on failure. This is useful
  159. * as failure of this function is very unlikely, it can only happen due
  160. * to lack of memory when allocating the chain to store all message
  161. * handlers for a protocol. Meant for use in init functions where lack
  162. * of memory implies no sense in continueing.
  163. */
  164. void rtnl_register(int protocol, int msgtype,
  165. rtnl_doit_func doit, rtnl_dumpit_func dumpit)
  166. {
  167. if (__rtnl_register(protocol, msgtype, doit, dumpit) < 0)
  168. panic("Unable to register rtnetlink message handler, "
  169. "protocol = %d, message type = %d\n",
  170. protocol, msgtype);
  171. }
  172. EXPORT_SYMBOL_GPL(rtnl_register);
  173. /**
  174. * rtnl_unregister - Unregister a rtnetlink message type
  175. * @protocol: Protocol family or PF_UNSPEC
  176. * @msgtype: rtnetlink message type
  177. *
  178. * Returns 0 on success or a negative error code.
  179. */
  180. int rtnl_unregister(int protocol, int msgtype)
  181. {
  182. int msgindex;
  183. BUG_ON(protocol < 0 || protocol >= NPROTO);
  184. msgindex = rtm_msgindex(msgtype);
  185. if (rtnl_msg_handlers[protocol] == NULL)
  186. return -ENOENT;
  187. rtnl_msg_handlers[protocol][msgindex].doit = NULL;
  188. rtnl_msg_handlers[protocol][msgindex].dumpit = NULL;
  189. return 0;
  190. }
  191. EXPORT_SYMBOL_GPL(rtnl_unregister);
  192. /**
  193. * rtnl_unregister_all - Unregister all rtnetlink message type of a protocol
  194. * @protocol : Protocol family or PF_UNSPEC
  195. *
  196. * Identical to calling rtnl_unregster() for all registered message types
  197. * of a certain protocol family.
  198. */
  199. void rtnl_unregister_all(int protocol)
  200. {
  201. BUG_ON(protocol < 0 || protocol >= NPROTO);
  202. kfree(rtnl_msg_handlers[protocol]);
  203. rtnl_msg_handlers[protocol] = NULL;
  204. }
  205. EXPORT_SYMBOL_GPL(rtnl_unregister_all);
  206. static LIST_HEAD(link_ops);
  207. /**
  208. * __rtnl_link_register - Register rtnl_link_ops with rtnetlink.
  209. * @ops: struct rtnl_link_ops * to register
  210. *
  211. * The caller must hold the rtnl_mutex. This function should be used
  212. * by drivers that create devices during module initialization. It
  213. * must be called before registering the devices.
  214. *
  215. * Returns 0 on success or a negative error code.
  216. */
  217. int __rtnl_link_register(struct rtnl_link_ops *ops)
  218. {
  219. if (!ops->dellink)
  220. ops->dellink = unregister_netdevice_queue;
  221. list_add_tail(&ops->list, &link_ops);
  222. return 0;
  223. }
  224. EXPORT_SYMBOL_GPL(__rtnl_link_register);
  225. /**
  226. * rtnl_link_register - Register rtnl_link_ops with rtnetlink.
  227. * @ops: struct rtnl_link_ops * to register
  228. *
  229. * Returns 0 on success or a negative error code.
  230. */
  231. int rtnl_link_register(struct rtnl_link_ops *ops)
  232. {
  233. int err;
  234. rtnl_lock();
  235. err = __rtnl_link_register(ops);
  236. rtnl_unlock();
  237. return err;
  238. }
  239. EXPORT_SYMBOL_GPL(rtnl_link_register);
  240. static void __rtnl_kill_links(struct net *net, struct rtnl_link_ops *ops)
  241. {
  242. struct net_device *dev;
  243. LIST_HEAD(list_kill);
  244. for_each_netdev(net, dev) {
  245. if (dev->rtnl_link_ops == ops)
  246. ops->dellink(dev, &list_kill);
  247. }
  248. unregister_netdevice_many(&list_kill);
  249. }
  250. void rtnl_kill_links(struct net *net, struct rtnl_link_ops *ops)
  251. {
  252. rtnl_lock();
  253. __rtnl_kill_links(net, ops);
  254. rtnl_unlock();
  255. }
  256. EXPORT_SYMBOL_GPL(rtnl_kill_links);
  257. /**
  258. * __rtnl_link_unregister - Unregister rtnl_link_ops from rtnetlink.
  259. * @ops: struct rtnl_link_ops * to unregister
  260. *
  261. * The caller must hold the rtnl_mutex.
  262. */
  263. void __rtnl_link_unregister(struct rtnl_link_ops *ops)
  264. {
  265. struct net *net;
  266. for_each_net(net) {
  267. __rtnl_kill_links(net, ops);
  268. }
  269. list_del(&ops->list);
  270. }
  271. EXPORT_SYMBOL_GPL(__rtnl_link_unregister);
  272. /**
  273. * rtnl_link_unregister - Unregister rtnl_link_ops from rtnetlink.
  274. * @ops: struct rtnl_link_ops * to unregister
  275. */
  276. void rtnl_link_unregister(struct rtnl_link_ops *ops)
  277. {
  278. rtnl_lock();
  279. __rtnl_link_unregister(ops);
  280. rtnl_unlock();
  281. }
  282. EXPORT_SYMBOL_GPL(rtnl_link_unregister);
  283. static const struct rtnl_link_ops *rtnl_link_ops_get(const char *kind)
  284. {
  285. const struct rtnl_link_ops *ops;
  286. list_for_each_entry(ops, &link_ops, list) {
  287. if (!strcmp(ops->kind, kind))
  288. return ops;
  289. }
  290. return NULL;
  291. }
  292. static size_t rtnl_link_get_size(const struct net_device *dev)
  293. {
  294. const struct rtnl_link_ops *ops = dev->rtnl_link_ops;
  295. size_t size;
  296. if (!ops)
  297. return 0;
  298. size = nlmsg_total_size(sizeof(struct nlattr)) + /* IFLA_LINKINFO */
  299. nlmsg_total_size(strlen(ops->kind) + 1); /* IFLA_INFO_KIND */
  300. if (ops->get_size)
  301. /* IFLA_INFO_DATA + nested data */
  302. size += nlmsg_total_size(sizeof(struct nlattr)) +
  303. ops->get_size(dev);
  304. if (ops->get_xstats_size)
  305. size += ops->get_xstats_size(dev); /* IFLA_INFO_XSTATS */
  306. return size;
  307. }
  308. static int rtnl_link_fill(struct sk_buff *skb, const struct net_device *dev)
  309. {
  310. const struct rtnl_link_ops *ops = dev->rtnl_link_ops;
  311. struct nlattr *linkinfo, *data;
  312. int err = -EMSGSIZE;
  313. linkinfo = nla_nest_start(skb, IFLA_LINKINFO);
  314. if (linkinfo == NULL)
  315. goto out;
  316. if (nla_put_string(skb, IFLA_INFO_KIND, ops->kind) < 0)
  317. goto err_cancel_link;
  318. if (ops->fill_xstats) {
  319. err = ops->fill_xstats(skb, dev);
  320. if (err < 0)
  321. goto err_cancel_link;
  322. }
  323. if (ops->fill_info) {
  324. data = nla_nest_start(skb, IFLA_INFO_DATA);
  325. if (data == NULL)
  326. goto err_cancel_link;
  327. err = ops->fill_info(skb, dev);
  328. if (err < 0)
  329. goto err_cancel_data;
  330. nla_nest_end(skb, data);
  331. }
  332. nla_nest_end(skb, linkinfo);
  333. return 0;
  334. err_cancel_data:
  335. nla_nest_cancel(skb, data);
  336. err_cancel_link:
  337. nla_nest_cancel(skb, linkinfo);
  338. out:
  339. return err;
  340. }
  341. static const int rtm_min[RTM_NR_FAMILIES] =
  342. {
  343. [RTM_FAM(RTM_NEWLINK)] = NLMSG_LENGTH(sizeof(struct ifinfomsg)),
  344. [RTM_FAM(RTM_NEWADDR)] = NLMSG_LENGTH(sizeof(struct ifaddrmsg)),
  345. [RTM_FAM(RTM_NEWROUTE)] = NLMSG_LENGTH(sizeof(struct rtmsg)),
  346. [RTM_FAM(RTM_NEWRULE)] = NLMSG_LENGTH(sizeof(struct fib_rule_hdr)),
  347. [RTM_FAM(RTM_NEWQDISC)] = NLMSG_LENGTH(sizeof(struct tcmsg)),
  348. [RTM_FAM(RTM_NEWTCLASS)] = NLMSG_LENGTH(sizeof(struct tcmsg)),
  349. [RTM_FAM(RTM_NEWTFILTER)] = NLMSG_LENGTH(sizeof(struct tcmsg)),
  350. [RTM_FAM(RTM_NEWACTION)] = NLMSG_LENGTH(sizeof(struct tcamsg)),
  351. [RTM_FAM(RTM_GETMULTICAST)] = NLMSG_LENGTH(sizeof(struct rtgenmsg)),
  352. [RTM_FAM(RTM_GETANYCAST)] = NLMSG_LENGTH(sizeof(struct rtgenmsg)),
  353. };
  354. static const int rta_max[RTM_NR_FAMILIES] =
  355. {
  356. [RTM_FAM(RTM_NEWLINK)] = IFLA_MAX,
  357. [RTM_FAM(RTM_NEWADDR)] = IFA_MAX,
  358. [RTM_FAM(RTM_NEWROUTE)] = RTA_MAX,
  359. [RTM_FAM(RTM_NEWRULE)] = FRA_MAX,
  360. [RTM_FAM(RTM_NEWQDISC)] = TCA_MAX,
  361. [RTM_FAM(RTM_NEWTCLASS)] = TCA_MAX,
  362. [RTM_FAM(RTM_NEWTFILTER)] = TCA_MAX,
  363. [RTM_FAM(RTM_NEWACTION)] = TCAA_MAX,
  364. };
  365. void __rta_fill(struct sk_buff *skb, int attrtype, int attrlen, const void *data)
  366. {
  367. struct rtattr *rta;
  368. int size = RTA_LENGTH(attrlen);
  369. rta = (struct rtattr *)skb_put(skb, RTA_ALIGN(size));
  370. rta->rta_type = attrtype;
  371. rta->rta_len = size;
  372. memcpy(RTA_DATA(rta), data, attrlen);
  373. memset(RTA_DATA(rta) + attrlen, 0, RTA_ALIGN(size) - size);
  374. }
  375. EXPORT_SYMBOL(__rta_fill);
  376. int rtnetlink_send(struct sk_buff *skb, struct net *net, u32 pid, unsigned group, int echo)
  377. {
  378. struct sock *rtnl = net->rtnl;
  379. int err = 0;
  380. NETLINK_CB(skb).dst_group = group;
  381. if (echo)
  382. atomic_inc(&skb->users);
  383. netlink_broadcast(rtnl, skb, pid, group, GFP_KERNEL);
  384. if (echo)
  385. err = netlink_unicast(rtnl, skb, pid, MSG_DONTWAIT);
  386. return err;
  387. }
  388. int rtnl_unicast(struct sk_buff *skb, struct net *net, u32 pid)
  389. {
  390. struct sock *rtnl = net->rtnl;
  391. return nlmsg_unicast(rtnl, skb, pid);
  392. }
  393. EXPORT_SYMBOL(rtnl_unicast);
  394. void rtnl_notify(struct sk_buff *skb, struct net *net, u32 pid, u32 group,
  395. struct nlmsghdr *nlh, gfp_t flags)
  396. {
  397. struct sock *rtnl = net->rtnl;
  398. int report = 0;
  399. if (nlh)
  400. report = nlmsg_report(nlh);
  401. nlmsg_notify(rtnl, skb, pid, group, report, flags);
  402. }
  403. EXPORT_SYMBOL(rtnl_notify);
  404. void rtnl_set_sk_err(struct net *net, u32 group, int error)
  405. {
  406. struct sock *rtnl = net->rtnl;
  407. netlink_set_err(rtnl, 0, group, error);
  408. }
  409. EXPORT_SYMBOL(rtnl_set_sk_err);
  410. int rtnetlink_put_metrics(struct sk_buff *skb, u32 *metrics)
  411. {
  412. struct nlattr *mx;
  413. int i, valid = 0;
  414. mx = nla_nest_start(skb, RTA_METRICS);
  415. if (mx == NULL)
  416. return -ENOBUFS;
  417. for (i = 0; i < RTAX_MAX; i++) {
  418. if (metrics[i]) {
  419. valid++;
  420. NLA_PUT_U32(skb, i+1, metrics[i]);
  421. }
  422. }
  423. if (!valid) {
  424. nla_nest_cancel(skb, mx);
  425. return 0;
  426. }
  427. return nla_nest_end(skb, mx);
  428. nla_put_failure:
  429. nla_nest_cancel(skb, mx);
  430. return -EMSGSIZE;
  431. }
  432. EXPORT_SYMBOL(rtnetlink_put_metrics);
  433. int rtnl_put_cacheinfo(struct sk_buff *skb, struct dst_entry *dst, u32 id,
  434. u32 ts, u32 tsage, long expires, u32 error)
  435. {
  436. struct rta_cacheinfo ci = {
  437. .rta_lastuse = jiffies_to_clock_t(jiffies - dst->lastuse),
  438. .rta_used = dst->__use,
  439. .rta_clntref = atomic_read(&(dst->__refcnt)),
  440. .rta_error = error,
  441. .rta_id = id,
  442. .rta_ts = ts,
  443. .rta_tsage = tsage,
  444. };
  445. if (expires)
  446. ci.rta_expires = jiffies_to_clock_t(expires);
  447. return nla_put(skb, RTA_CACHEINFO, sizeof(ci), &ci);
  448. }
  449. EXPORT_SYMBOL_GPL(rtnl_put_cacheinfo);
  450. static void set_operstate(struct net_device *dev, unsigned char transition)
  451. {
  452. unsigned char operstate = dev->operstate;
  453. switch (transition) {
  454. case IF_OPER_UP:
  455. if ((operstate == IF_OPER_DORMANT ||
  456. operstate == IF_OPER_UNKNOWN) &&
  457. !netif_dormant(dev))
  458. operstate = IF_OPER_UP;
  459. break;
  460. case IF_OPER_DORMANT:
  461. if (operstate == IF_OPER_UP ||
  462. operstate == IF_OPER_UNKNOWN)
  463. operstate = IF_OPER_DORMANT;
  464. break;
  465. }
  466. if (dev->operstate != operstate) {
  467. write_lock_bh(&dev_base_lock);
  468. dev->operstate = operstate;
  469. write_unlock_bh(&dev_base_lock);
  470. netdev_state_change(dev);
  471. }
  472. }
  473. static unsigned int rtnl_dev_combine_flags(const struct net_device *dev,
  474. const struct ifinfomsg *ifm)
  475. {
  476. unsigned int flags = ifm->ifi_flags;
  477. /* bugwards compatibility: ifi_change == 0 is treated as ~0 */
  478. if (ifm->ifi_change)
  479. flags = (flags & ifm->ifi_change) |
  480. (dev->flags & ~ifm->ifi_change);
  481. return flags;
  482. }
  483. static void copy_rtnl_link_stats(struct rtnl_link_stats *a,
  484. const struct net_device_stats *b)
  485. {
  486. a->rx_packets = b->rx_packets;
  487. a->tx_packets = b->tx_packets;
  488. a->rx_bytes = b->rx_bytes;
  489. a->tx_bytes = b->tx_bytes;
  490. a->rx_errors = b->rx_errors;
  491. a->tx_errors = b->tx_errors;
  492. a->rx_dropped = b->rx_dropped;
  493. a->tx_dropped = b->tx_dropped;
  494. a->multicast = b->multicast;
  495. a->collisions = b->collisions;
  496. a->rx_length_errors = b->rx_length_errors;
  497. a->rx_over_errors = b->rx_over_errors;
  498. a->rx_crc_errors = b->rx_crc_errors;
  499. a->rx_frame_errors = b->rx_frame_errors;
  500. a->rx_fifo_errors = b->rx_fifo_errors;
  501. a->rx_missed_errors = b->rx_missed_errors;
  502. a->tx_aborted_errors = b->tx_aborted_errors;
  503. a->tx_carrier_errors = b->tx_carrier_errors;
  504. a->tx_fifo_errors = b->tx_fifo_errors;
  505. a->tx_heartbeat_errors = b->tx_heartbeat_errors;
  506. a->tx_window_errors = b->tx_window_errors;
  507. a->rx_compressed = b->rx_compressed;
  508. a->tx_compressed = b->tx_compressed;
  509. };
  510. /* All VF info */
  511. static inline int rtnl_vfinfo_size(const struct net_device *dev)
  512. {
  513. if (dev->dev.parent && dev_is_pci(dev->dev.parent)) {
  514. int num_vfs = dev_num_vf(dev->dev.parent);
  515. size_t size = nlmsg_total_size(sizeof(struct nlattr));
  516. size += nlmsg_total_size(num_vfs * sizeof(struct nlattr));
  517. size += num_vfs * (sizeof(struct ifla_vf_mac) +
  518. sizeof(struct ifla_vf_vlan) +
  519. sizeof(struct ifla_vf_tx_rate));
  520. return size;
  521. } else
  522. return 0;
  523. }
  524. static inline size_t if_nlmsg_size(const struct net_device *dev)
  525. {
  526. return NLMSG_ALIGN(sizeof(struct ifinfomsg))
  527. + nla_total_size(IFNAMSIZ) /* IFLA_IFNAME */
  528. + nla_total_size(IFALIASZ) /* IFLA_IFALIAS */
  529. + nla_total_size(IFNAMSIZ) /* IFLA_QDISC */
  530. + nla_total_size(sizeof(struct rtnl_link_ifmap))
  531. + nla_total_size(sizeof(struct rtnl_link_stats))
  532. + nla_total_size(MAX_ADDR_LEN) /* IFLA_ADDRESS */
  533. + nla_total_size(MAX_ADDR_LEN) /* IFLA_BROADCAST */
  534. + nla_total_size(4) /* IFLA_TXQLEN */
  535. + nla_total_size(4) /* IFLA_WEIGHT */
  536. + nla_total_size(4) /* IFLA_MTU */
  537. + nla_total_size(4) /* IFLA_LINK */
  538. + nla_total_size(4) /* IFLA_MASTER */
  539. + nla_total_size(1) /* IFLA_OPERSTATE */
  540. + nla_total_size(1) /* IFLA_LINKMODE */
  541. + nla_total_size(4) /* IFLA_NUM_VF */
  542. + rtnl_vfinfo_size(dev) /* IFLA_VFINFO_LIST */
  543. + rtnl_link_get_size(dev); /* IFLA_LINKINFO */
  544. }
  545. static int rtnl_fill_ifinfo(struct sk_buff *skb, struct net_device *dev,
  546. int type, u32 pid, u32 seq, u32 change,
  547. unsigned int flags)
  548. {
  549. struct ifinfomsg *ifm;
  550. struct nlmsghdr *nlh;
  551. const struct net_device_stats *stats;
  552. struct nlattr *attr;
  553. nlh = nlmsg_put(skb, pid, seq, type, sizeof(*ifm), flags);
  554. if (nlh == NULL)
  555. return -EMSGSIZE;
  556. ifm = nlmsg_data(nlh);
  557. ifm->ifi_family = AF_UNSPEC;
  558. ifm->__ifi_pad = 0;
  559. ifm->ifi_type = dev->type;
  560. ifm->ifi_index = dev->ifindex;
  561. ifm->ifi_flags = dev_get_flags(dev);
  562. ifm->ifi_change = change;
  563. NLA_PUT_STRING(skb, IFLA_IFNAME, dev->name);
  564. NLA_PUT_U32(skb, IFLA_TXQLEN, dev->tx_queue_len);
  565. NLA_PUT_U8(skb, IFLA_OPERSTATE,
  566. netif_running(dev) ? dev->operstate : IF_OPER_DOWN);
  567. NLA_PUT_U8(skb, IFLA_LINKMODE, dev->link_mode);
  568. NLA_PUT_U32(skb, IFLA_MTU, dev->mtu);
  569. if (dev->ifindex != dev->iflink)
  570. NLA_PUT_U32(skb, IFLA_LINK, dev->iflink);
  571. if (dev->master)
  572. NLA_PUT_U32(skb, IFLA_MASTER, dev->master->ifindex);
  573. if (dev->qdisc)
  574. NLA_PUT_STRING(skb, IFLA_QDISC, dev->qdisc->ops->id);
  575. if (dev->ifalias)
  576. NLA_PUT_STRING(skb, IFLA_IFALIAS, dev->ifalias);
  577. if (1) {
  578. struct rtnl_link_ifmap map = {
  579. .mem_start = dev->mem_start,
  580. .mem_end = dev->mem_end,
  581. .base_addr = dev->base_addr,
  582. .irq = dev->irq,
  583. .dma = dev->dma,
  584. .port = dev->if_port,
  585. };
  586. NLA_PUT(skb, IFLA_MAP, sizeof(map), &map);
  587. }
  588. if (dev->addr_len) {
  589. NLA_PUT(skb, IFLA_ADDRESS, dev->addr_len, dev->dev_addr);
  590. NLA_PUT(skb, IFLA_BROADCAST, dev->addr_len, dev->broadcast);
  591. }
  592. attr = nla_reserve(skb, IFLA_STATS,
  593. sizeof(struct rtnl_link_stats));
  594. if (attr == NULL)
  595. goto nla_put_failure;
  596. stats = dev_get_stats(dev);
  597. copy_rtnl_link_stats(nla_data(attr), stats);
  598. if (dev->netdev_ops->ndo_get_vf_config && dev->dev.parent) {
  599. int i;
  600. struct nlattr *vfinfo, *vf;
  601. int num_vfs = dev_num_vf(dev->dev.parent);
  602. NLA_PUT_U32(skb, IFLA_NUM_VF, num_vfs);
  603. vfinfo = nla_nest_start(skb, IFLA_VFINFO_LIST);
  604. if (!vfinfo)
  605. goto nla_put_failure;
  606. for (i = 0; i < num_vfs; i++) {
  607. struct ifla_vf_info ivi;
  608. struct ifla_vf_mac vf_mac;
  609. struct ifla_vf_vlan vf_vlan;
  610. struct ifla_vf_tx_rate vf_tx_rate;
  611. if (dev->netdev_ops->ndo_get_vf_config(dev, i, &ivi))
  612. break;
  613. vf_mac.vf = vf_vlan.vf = vf_tx_rate.vf = ivi.vf;
  614. memcpy(vf_mac.mac, ivi.mac, sizeof(ivi.mac));
  615. vf_vlan.vlan = ivi.vlan;
  616. vf_vlan.qos = ivi.qos;
  617. vf_tx_rate.rate = ivi.tx_rate;
  618. vf = nla_nest_start(skb, IFLA_VF_INFO);
  619. if (!vf) {
  620. nla_nest_cancel(skb, vfinfo);
  621. goto nla_put_failure;
  622. }
  623. NLA_PUT(skb, IFLA_VF_MAC, sizeof(vf_mac), &vf_mac);
  624. NLA_PUT(skb, IFLA_VF_VLAN, sizeof(vf_vlan), &vf_vlan);
  625. NLA_PUT(skb, IFLA_VF_TX_RATE, sizeof(vf_tx_rate), &vf_tx_rate);
  626. nla_nest_end(skb, vf);
  627. }
  628. nla_nest_end(skb, vfinfo);
  629. }
  630. if (dev->rtnl_link_ops) {
  631. if (rtnl_link_fill(skb, dev) < 0)
  632. goto nla_put_failure;
  633. }
  634. return nlmsg_end(skb, nlh);
  635. nla_put_failure:
  636. nlmsg_cancel(skb, nlh);
  637. return -EMSGSIZE;
  638. }
  639. static int rtnl_dump_ifinfo(struct sk_buff *skb, struct netlink_callback *cb)
  640. {
  641. struct net *net = sock_net(skb->sk);
  642. int h, s_h;
  643. int idx = 0, s_idx;
  644. struct net_device *dev;
  645. struct hlist_head *head;
  646. struct hlist_node *node;
  647. s_h = cb->args[0];
  648. s_idx = cb->args[1];
  649. for (h = s_h; h < NETDEV_HASHENTRIES; h++, s_idx = 0) {
  650. idx = 0;
  651. head = &net->dev_index_head[h];
  652. hlist_for_each_entry(dev, node, head, index_hlist) {
  653. if (idx < s_idx)
  654. goto cont;
  655. if (rtnl_fill_ifinfo(skb, dev, RTM_NEWLINK,
  656. NETLINK_CB(cb->skb).pid,
  657. cb->nlh->nlmsg_seq, 0,
  658. NLM_F_MULTI) <= 0)
  659. goto out;
  660. cont:
  661. idx++;
  662. }
  663. }
  664. out:
  665. cb->args[1] = idx;
  666. cb->args[0] = h;
  667. return skb->len;
  668. }
  669. const struct nla_policy ifla_policy[IFLA_MAX+1] = {
  670. [IFLA_IFNAME] = { .type = NLA_STRING, .len = IFNAMSIZ-1 },
  671. [IFLA_ADDRESS] = { .type = NLA_BINARY, .len = MAX_ADDR_LEN },
  672. [IFLA_BROADCAST] = { .type = NLA_BINARY, .len = MAX_ADDR_LEN },
  673. [IFLA_MAP] = { .len = sizeof(struct rtnl_link_ifmap) },
  674. [IFLA_MTU] = { .type = NLA_U32 },
  675. [IFLA_LINK] = { .type = NLA_U32 },
  676. [IFLA_TXQLEN] = { .type = NLA_U32 },
  677. [IFLA_WEIGHT] = { .type = NLA_U32 },
  678. [IFLA_OPERSTATE] = { .type = NLA_U8 },
  679. [IFLA_LINKMODE] = { .type = NLA_U8 },
  680. [IFLA_LINKINFO] = { .type = NLA_NESTED },
  681. [IFLA_NET_NS_PID] = { .type = NLA_U32 },
  682. [IFLA_IFALIAS] = { .type = NLA_STRING, .len = IFALIASZ-1 },
  683. [IFLA_VFINFO_LIST] = {. type = NLA_NESTED },
  684. };
  685. EXPORT_SYMBOL(ifla_policy);
  686. static const struct nla_policy ifla_info_policy[IFLA_INFO_MAX+1] = {
  687. [IFLA_INFO_KIND] = { .type = NLA_STRING },
  688. [IFLA_INFO_DATA] = { .type = NLA_NESTED },
  689. };
  690. static const struct nla_policy ifla_vfinfo_policy[IFLA_VF_INFO_MAX+1] = {
  691. [IFLA_VF_INFO] = { .type = NLA_NESTED },
  692. };
  693. static const struct nla_policy ifla_vf_policy[IFLA_VF_MAX+1] = {
  694. [IFLA_VF_MAC] = { .type = NLA_BINARY,
  695. .len = sizeof(struct ifla_vf_mac) },
  696. [IFLA_VF_VLAN] = { .type = NLA_BINARY,
  697. .len = sizeof(struct ifla_vf_vlan) },
  698. [IFLA_VF_TX_RATE] = { .type = NLA_BINARY,
  699. .len = sizeof(struct ifla_vf_tx_rate) },
  700. };
  701. struct net *rtnl_link_get_net(struct net *src_net, struct nlattr *tb[])
  702. {
  703. struct net *net;
  704. /* Examine the link attributes and figure out which
  705. * network namespace we are talking about.
  706. */
  707. if (tb[IFLA_NET_NS_PID])
  708. net = get_net_ns_by_pid(nla_get_u32(tb[IFLA_NET_NS_PID]));
  709. else
  710. net = get_net(src_net);
  711. return net;
  712. }
  713. EXPORT_SYMBOL(rtnl_link_get_net);
  714. static int validate_linkmsg(struct net_device *dev, struct nlattr *tb[])
  715. {
  716. if (dev) {
  717. if (tb[IFLA_ADDRESS] &&
  718. nla_len(tb[IFLA_ADDRESS]) < dev->addr_len)
  719. return -EINVAL;
  720. if (tb[IFLA_BROADCAST] &&
  721. nla_len(tb[IFLA_BROADCAST]) < dev->addr_len)
  722. return -EINVAL;
  723. }
  724. return 0;
  725. }
  726. static int do_setvfinfo(struct net_device *dev, struct nlattr *attr)
  727. {
  728. int rem, err = -EINVAL;
  729. struct nlattr *vf;
  730. const struct net_device_ops *ops = dev->netdev_ops;
  731. nla_for_each_nested(vf, attr, rem) {
  732. switch (nla_type(vf)) {
  733. case IFLA_VF_MAC: {
  734. struct ifla_vf_mac *ivm;
  735. ivm = nla_data(vf);
  736. err = -EOPNOTSUPP;
  737. if (ops->ndo_set_vf_mac)
  738. err = ops->ndo_set_vf_mac(dev, ivm->vf,
  739. ivm->mac);
  740. break;
  741. }
  742. case IFLA_VF_VLAN: {
  743. struct ifla_vf_vlan *ivv;
  744. ivv = nla_data(vf);
  745. err = -EOPNOTSUPP;
  746. if (ops->ndo_set_vf_vlan)
  747. err = ops->ndo_set_vf_vlan(dev, ivv->vf,
  748. ivv->vlan,
  749. ivv->qos);
  750. break;
  751. }
  752. case IFLA_VF_TX_RATE: {
  753. struct ifla_vf_tx_rate *ivt;
  754. ivt = nla_data(vf);
  755. err = -EOPNOTSUPP;
  756. if (ops->ndo_set_vf_tx_rate)
  757. err = ops->ndo_set_vf_tx_rate(dev, ivt->vf,
  758. ivt->rate);
  759. break;
  760. }
  761. default:
  762. err = -EINVAL;
  763. break;
  764. }
  765. if (err)
  766. break;
  767. }
  768. return err;
  769. }
  770. static int do_setlink(struct net_device *dev, struct ifinfomsg *ifm,
  771. struct nlattr **tb, char *ifname, int modified)
  772. {
  773. const struct net_device_ops *ops = dev->netdev_ops;
  774. int send_addr_notify = 0;
  775. int err;
  776. if (tb[IFLA_NET_NS_PID]) {
  777. struct net *net = rtnl_link_get_net(dev_net(dev), tb);
  778. if (IS_ERR(net)) {
  779. err = PTR_ERR(net);
  780. goto errout;
  781. }
  782. err = dev_change_net_namespace(dev, net, ifname);
  783. put_net(net);
  784. if (err)
  785. goto errout;
  786. modified = 1;
  787. }
  788. if (tb[IFLA_MAP]) {
  789. struct rtnl_link_ifmap *u_map;
  790. struct ifmap k_map;
  791. if (!ops->ndo_set_config) {
  792. err = -EOPNOTSUPP;
  793. goto errout;
  794. }
  795. if (!netif_device_present(dev)) {
  796. err = -ENODEV;
  797. goto errout;
  798. }
  799. u_map = nla_data(tb[IFLA_MAP]);
  800. k_map.mem_start = (unsigned long) u_map->mem_start;
  801. k_map.mem_end = (unsigned long) u_map->mem_end;
  802. k_map.base_addr = (unsigned short) u_map->base_addr;
  803. k_map.irq = (unsigned char) u_map->irq;
  804. k_map.dma = (unsigned char) u_map->dma;
  805. k_map.port = (unsigned char) u_map->port;
  806. err = ops->ndo_set_config(dev, &k_map);
  807. if (err < 0)
  808. goto errout;
  809. modified = 1;
  810. }
  811. if (tb[IFLA_ADDRESS]) {
  812. struct sockaddr *sa;
  813. int len;
  814. if (!ops->ndo_set_mac_address) {
  815. err = -EOPNOTSUPP;
  816. goto errout;
  817. }
  818. if (!netif_device_present(dev)) {
  819. err = -ENODEV;
  820. goto errout;
  821. }
  822. len = sizeof(sa_family_t) + dev->addr_len;
  823. sa = kmalloc(len, GFP_KERNEL);
  824. if (!sa) {
  825. err = -ENOMEM;
  826. goto errout;
  827. }
  828. sa->sa_family = dev->type;
  829. memcpy(sa->sa_data, nla_data(tb[IFLA_ADDRESS]),
  830. dev->addr_len);
  831. err = ops->ndo_set_mac_address(dev, sa);
  832. kfree(sa);
  833. if (err)
  834. goto errout;
  835. send_addr_notify = 1;
  836. modified = 1;
  837. }
  838. if (tb[IFLA_MTU]) {
  839. err = dev_set_mtu(dev, nla_get_u32(tb[IFLA_MTU]));
  840. if (err < 0)
  841. goto errout;
  842. modified = 1;
  843. }
  844. /*
  845. * Interface selected by interface index but interface
  846. * name provided implies that a name change has been
  847. * requested.
  848. */
  849. if (ifm->ifi_index > 0 && ifname[0]) {
  850. err = dev_change_name(dev, ifname);
  851. if (err < 0)
  852. goto errout;
  853. modified = 1;
  854. }
  855. if (tb[IFLA_IFALIAS]) {
  856. err = dev_set_alias(dev, nla_data(tb[IFLA_IFALIAS]),
  857. nla_len(tb[IFLA_IFALIAS]));
  858. if (err < 0)
  859. goto errout;
  860. modified = 1;
  861. }
  862. if (tb[IFLA_BROADCAST]) {
  863. nla_memcpy(dev->broadcast, tb[IFLA_BROADCAST], dev->addr_len);
  864. send_addr_notify = 1;
  865. }
  866. if (ifm->ifi_flags || ifm->ifi_change) {
  867. err = dev_change_flags(dev, rtnl_dev_combine_flags(dev, ifm));
  868. if (err < 0)
  869. goto errout;
  870. }
  871. if (tb[IFLA_TXQLEN])
  872. dev->tx_queue_len = nla_get_u32(tb[IFLA_TXQLEN]);
  873. if (tb[IFLA_OPERSTATE])
  874. set_operstate(dev, nla_get_u8(tb[IFLA_OPERSTATE]));
  875. if (tb[IFLA_LINKMODE]) {
  876. write_lock_bh(&dev_base_lock);
  877. dev->link_mode = nla_get_u8(tb[IFLA_LINKMODE]);
  878. write_unlock_bh(&dev_base_lock);
  879. }
  880. if (tb[IFLA_VFINFO_LIST]) {
  881. struct nlattr *attr;
  882. int rem;
  883. nla_for_each_nested(attr, tb[IFLA_VFINFO_LIST], rem) {
  884. if (nla_type(attr) != IFLA_VF_INFO)
  885. goto errout;
  886. err = do_setvfinfo(dev, attr);
  887. if (err < 0)
  888. goto errout;
  889. modified = 1;
  890. }
  891. }
  892. err = 0;
  893. errout:
  894. if (err < 0 && modified && net_ratelimit())
  895. printk(KERN_WARNING "A link change request failed with "
  896. "some changes comitted already. Interface %s may "
  897. "have been left with an inconsistent configuration, "
  898. "please check.\n", dev->name);
  899. if (send_addr_notify)
  900. call_netdevice_notifiers(NETDEV_CHANGEADDR, dev);
  901. return err;
  902. }
  903. static int rtnl_setlink(struct sk_buff *skb, struct nlmsghdr *nlh, void *arg)
  904. {
  905. struct net *net = sock_net(skb->sk);
  906. struct ifinfomsg *ifm;
  907. struct net_device *dev;
  908. int err;
  909. struct nlattr *tb[IFLA_MAX+1];
  910. char ifname[IFNAMSIZ];
  911. err = nlmsg_parse(nlh, sizeof(*ifm), tb, IFLA_MAX, ifla_policy);
  912. if (err < 0)
  913. goto errout;
  914. if (tb[IFLA_IFNAME])
  915. nla_strlcpy(ifname, tb[IFLA_IFNAME], IFNAMSIZ);
  916. else
  917. ifname[0] = '\0';
  918. err = -EINVAL;
  919. ifm = nlmsg_data(nlh);
  920. if (ifm->ifi_index > 0)
  921. dev = __dev_get_by_index(net, ifm->ifi_index);
  922. else if (tb[IFLA_IFNAME])
  923. dev = __dev_get_by_name(net, ifname);
  924. else
  925. goto errout;
  926. if (dev == NULL) {
  927. err = -ENODEV;
  928. goto errout;
  929. }
  930. err = validate_linkmsg(dev, tb);
  931. if (err < 0)
  932. goto errout;
  933. err = do_setlink(dev, ifm, tb, ifname, 0);
  934. errout:
  935. return err;
  936. }
  937. static int rtnl_dellink(struct sk_buff *skb, struct nlmsghdr *nlh, void *arg)
  938. {
  939. struct net *net = sock_net(skb->sk);
  940. const struct rtnl_link_ops *ops;
  941. struct net_device *dev;
  942. struct ifinfomsg *ifm;
  943. char ifname[IFNAMSIZ];
  944. struct nlattr *tb[IFLA_MAX+1];
  945. int err;
  946. err = nlmsg_parse(nlh, sizeof(*ifm), tb, IFLA_MAX, ifla_policy);
  947. if (err < 0)
  948. return err;
  949. if (tb[IFLA_IFNAME])
  950. nla_strlcpy(ifname, tb[IFLA_IFNAME], IFNAMSIZ);
  951. ifm = nlmsg_data(nlh);
  952. if (ifm->ifi_index > 0)
  953. dev = __dev_get_by_index(net, ifm->ifi_index);
  954. else if (tb[IFLA_IFNAME])
  955. dev = __dev_get_by_name(net, ifname);
  956. else
  957. return -EINVAL;
  958. if (!dev)
  959. return -ENODEV;
  960. ops = dev->rtnl_link_ops;
  961. if (!ops)
  962. return -EOPNOTSUPP;
  963. ops->dellink(dev, NULL);
  964. return 0;
  965. }
  966. int rtnl_configure_link(struct net_device *dev, const struct ifinfomsg *ifm)
  967. {
  968. unsigned int old_flags;
  969. int err;
  970. old_flags = dev->flags;
  971. if (ifm && (ifm->ifi_flags || ifm->ifi_change)) {
  972. err = __dev_change_flags(dev, rtnl_dev_combine_flags(dev, ifm));
  973. if (err < 0)
  974. return err;
  975. }
  976. dev->rtnl_link_state = RTNL_LINK_INITIALIZED;
  977. rtmsg_ifinfo(RTM_NEWLINK, dev, ~0U);
  978. __dev_notify_flags(dev, old_flags);
  979. return 0;
  980. }
  981. EXPORT_SYMBOL(rtnl_configure_link);
  982. struct net_device *rtnl_create_link(struct net *src_net, struct net *net,
  983. char *ifname, const struct rtnl_link_ops *ops, struct nlattr *tb[])
  984. {
  985. int err;
  986. struct net_device *dev;
  987. unsigned int num_queues = 1;
  988. unsigned int real_num_queues = 1;
  989. if (ops->get_tx_queues) {
  990. err = ops->get_tx_queues(src_net, tb, &num_queues,
  991. &real_num_queues);
  992. if (err)
  993. goto err;
  994. }
  995. err = -ENOMEM;
  996. dev = alloc_netdev_mq(ops->priv_size, ifname, ops->setup, num_queues);
  997. if (!dev)
  998. goto err;
  999. dev_net_set(dev, net);
  1000. dev->rtnl_link_ops = ops;
  1001. dev->rtnl_link_state = RTNL_LINK_INITIALIZING;
  1002. dev->real_num_tx_queues = real_num_queues;
  1003. if (strchr(dev->name, '%')) {
  1004. err = dev_alloc_name(dev, dev->name);
  1005. if (err < 0)
  1006. goto err_free;
  1007. }
  1008. if (tb[IFLA_MTU])
  1009. dev->mtu = nla_get_u32(tb[IFLA_MTU]);
  1010. if (tb[IFLA_ADDRESS])
  1011. memcpy(dev->dev_addr, nla_data(tb[IFLA_ADDRESS]),
  1012. nla_len(tb[IFLA_ADDRESS]));
  1013. if (tb[IFLA_BROADCAST])
  1014. memcpy(dev->broadcast, nla_data(tb[IFLA_BROADCAST]),
  1015. nla_len(tb[IFLA_BROADCAST]));
  1016. if (tb[IFLA_TXQLEN])
  1017. dev->tx_queue_len = nla_get_u32(tb[IFLA_TXQLEN]);
  1018. if (tb[IFLA_OPERSTATE])
  1019. set_operstate(dev, nla_get_u8(tb[IFLA_OPERSTATE]));
  1020. if (tb[IFLA_LINKMODE])
  1021. dev->link_mode = nla_get_u8(tb[IFLA_LINKMODE]);
  1022. return dev;
  1023. err_free:
  1024. free_netdev(dev);
  1025. err:
  1026. return ERR_PTR(err);
  1027. }
  1028. EXPORT_SYMBOL(rtnl_create_link);
  1029. static int rtnl_newlink(struct sk_buff *skb, struct nlmsghdr *nlh, void *arg)
  1030. {
  1031. struct net *net = sock_net(skb->sk);
  1032. const struct rtnl_link_ops *ops;
  1033. struct net_device *dev;
  1034. struct ifinfomsg *ifm;
  1035. char kind[MODULE_NAME_LEN];
  1036. char ifname[IFNAMSIZ];
  1037. struct nlattr *tb[IFLA_MAX+1];
  1038. struct nlattr *linkinfo[IFLA_INFO_MAX+1];
  1039. int err;
  1040. #ifdef CONFIG_MODULES
  1041. replay:
  1042. #endif
  1043. err = nlmsg_parse(nlh, sizeof(*ifm), tb, IFLA_MAX, ifla_policy);
  1044. if (err < 0)
  1045. return err;
  1046. if (tb[IFLA_IFNAME])
  1047. nla_strlcpy(ifname, tb[IFLA_IFNAME], IFNAMSIZ);
  1048. else
  1049. ifname[0] = '\0';
  1050. ifm = nlmsg_data(nlh);
  1051. if (ifm->ifi_index > 0)
  1052. dev = __dev_get_by_index(net, ifm->ifi_index);
  1053. else if (ifname[0])
  1054. dev = __dev_get_by_name(net, ifname);
  1055. else
  1056. dev = NULL;
  1057. err = validate_linkmsg(dev, tb);
  1058. if (err < 0)
  1059. return err;
  1060. if (tb[IFLA_LINKINFO]) {
  1061. err = nla_parse_nested(linkinfo, IFLA_INFO_MAX,
  1062. tb[IFLA_LINKINFO], ifla_info_policy);
  1063. if (err < 0)
  1064. return err;
  1065. } else
  1066. memset(linkinfo, 0, sizeof(linkinfo));
  1067. if (linkinfo[IFLA_INFO_KIND]) {
  1068. nla_strlcpy(kind, linkinfo[IFLA_INFO_KIND], sizeof(kind));
  1069. ops = rtnl_link_ops_get(kind);
  1070. } else {
  1071. kind[0] = '\0';
  1072. ops = NULL;
  1073. }
  1074. if (1) {
  1075. struct nlattr *attr[ops ? ops->maxtype + 1 : 0], **data = NULL;
  1076. struct net *dest_net;
  1077. if (ops) {
  1078. if (ops->maxtype && linkinfo[IFLA_INFO_DATA]) {
  1079. err = nla_parse_nested(attr, ops->maxtype,
  1080. linkinfo[IFLA_INFO_DATA],
  1081. ops->policy);
  1082. if (err < 0)
  1083. return err;
  1084. data = attr;
  1085. }
  1086. if (ops->validate) {
  1087. err = ops->validate(tb, data);
  1088. if (err < 0)
  1089. return err;
  1090. }
  1091. }
  1092. if (dev) {
  1093. int modified = 0;
  1094. if (nlh->nlmsg_flags & NLM_F_EXCL)
  1095. return -EEXIST;
  1096. if (nlh->nlmsg_flags & NLM_F_REPLACE)
  1097. return -EOPNOTSUPP;
  1098. if (linkinfo[IFLA_INFO_DATA]) {
  1099. if (!ops || ops != dev->rtnl_link_ops ||
  1100. !ops->changelink)
  1101. return -EOPNOTSUPP;
  1102. err = ops->changelink(dev, tb, data);
  1103. if (err < 0)
  1104. return err;
  1105. modified = 1;
  1106. }
  1107. return do_setlink(dev, ifm, tb, ifname, modified);
  1108. }
  1109. if (!(nlh->nlmsg_flags & NLM_F_CREATE))
  1110. return -ENODEV;
  1111. if (ifm->ifi_index)
  1112. return -EOPNOTSUPP;
  1113. if (tb[IFLA_MAP] || tb[IFLA_MASTER] || tb[IFLA_PROTINFO])
  1114. return -EOPNOTSUPP;
  1115. if (!ops) {
  1116. #ifdef CONFIG_MODULES
  1117. if (kind[0]) {
  1118. __rtnl_unlock();
  1119. request_module("rtnl-link-%s", kind);
  1120. rtnl_lock();
  1121. ops = rtnl_link_ops_get(kind);
  1122. if (ops)
  1123. goto replay;
  1124. }
  1125. #endif
  1126. return -EOPNOTSUPP;
  1127. }
  1128. if (!ifname[0])
  1129. snprintf(ifname, IFNAMSIZ, "%s%%d", ops->kind);
  1130. dest_net = rtnl_link_get_net(net, tb);
  1131. dev = rtnl_create_link(net, dest_net, ifname, ops, tb);
  1132. if (IS_ERR(dev))
  1133. err = PTR_ERR(dev);
  1134. else if (ops->newlink)
  1135. err = ops->newlink(net, dev, tb, data);
  1136. else
  1137. err = register_netdevice(dev);
  1138. if (err < 0 && !IS_ERR(dev))
  1139. free_netdev(dev);
  1140. if (err < 0)
  1141. goto out;
  1142. err = rtnl_configure_link(dev, ifm);
  1143. if (err < 0)
  1144. unregister_netdevice(dev);
  1145. out:
  1146. put_net(dest_net);
  1147. return err;
  1148. }
  1149. }
  1150. static int rtnl_getlink(struct sk_buff *skb, struct nlmsghdr* nlh, void *arg)
  1151. {
  1152. struct net *net = sock_net(skb->sk);
  1153. struct ifinfomsg *ifm;
  1154. char ifname[IFNAMSIZ];
  1155. struct nlattr *tb[IFLA_MAX+1];
  1156. struct net_device *dev = NULL;
  1157. struct sk_buff *nskb;
  1158. int err;
  1159. err = nlmsg_parse(nlh, sizeof(*ifm), tb, IFLA_MAX, ifla_policy);
  1160. if (err < 0)
  1161. return err;
  1162. if (tb[IFLA_IFNAME])
  1163. nla_strlcpy(ifname, tb[IFLA_IFNAME], IFNAMSIZ);
  1164. ifm = nlmsg_data(nlh);
  1165. if (ifm->ifi_index > 0)
  1166. dev = __dev_get_by_index(net, ifm->ifi_index);
  1167. else if (tb[IFLA_IFNAME])
  1168. dev = __dev_get_by_name(net, ifname);
  1169. else
  1170. return -EINVAL;
  1171. if (dev == NULL)
  1172. return -ENODEV;
  1173. nskb = nlmsg_new(if_nlmsg_size(dev), GFP_KERNEL);
  1174. if (nskb == NULL)
  1175. return -ENOBUFS;
  1176. err = rtnl_fill_ifinfo(nskb, dev, RTM_NEWLINK, NETLINK_CB(skb).pid,
  1177. nlh->nlmsg_seq, 0, 0);
  1178. if (err < 0) {
  1179. /* -EMSGSIZE implies BUG in if_nlmsg_size */
  1180. WARN_ON(err == -EMSGSIZE);
  1181. kfree_skb(nskb);
  1182. } else
  1183. err = rtnl_unicast(nskb, net, NETLINK_CB(skb).pid);
  1184. return err;
  1185. }
  1186. static int rtnl_dump_all(struct sk_buff *skb, struct netlink_callback *cb)
  1187. {
  1188. int idx;
  1189. int s_idx = cb->family;
  1190. if (s_idx == 0)
  1191. s_idx = 1;
  1192. for (idx = 1; idx < NPROTO; idx++) {
  1193. int type = cb->nlh->nlmsg_type-RTM_BASE;
  1194. if (idx < s_idx || idx == PF_PACKET)
  1195. continue;
  1196. if (rtnl_msg_handlers[idx] == NULL ||
  1197. rtnl_msg_handlers[idx][type].dumpit == NULL)
  1198. continue;
  1199. if (idx > s_idx)
  1200. memset(&cb->args[0], 0, sizeof(cb->args));
  1201. if (rtnl_msg_handlers[idx][type].dumpit(skb, cb))
  1202. break;
  1203. }
  1204. cb->family = idx;
  1205. return skb->len;
  1206. }
  1207. void rtmsg_ifinfo(int type, struct net_device *dev, unsigned change)
  1208. {
  1209. struct net *net = dev_net(dev);
  1210. struct sk_buff *skb;
  1211. int err = -ENOBUFS;
  1212. skb = nlmsg_new(if_nlmsg_size(dev), GFP_KERNEL);
  1213. if (skb == NULL)
  1214. goto errout;
  1215. err = rtnl_fill_ifinfo(skb, dev, type, 0, 0, change, 0);
  1216. if (err < 0) {
  1217. /* -EMSGSIZE implies BUG in if_nlmsg_size() */
  1218. WARN_ON(err == -EMSGSIZE);
  1219. kfree_skb(skb);
  1220. goto errout;
  1221. }
  1222. rtnl_notify(skb, net, 0, RTNLGRP_LINK, NULL, GFP_KERNEL);
  1223. return;
  1224. errout:
  1225. if (err < 0)
  1226. rtnl_set_sk_err(net, RTNLGRP_LINK, err);
  1227. }
  1228. /* Protected by RTNL sempahore. */
  1229. static struct rtattr **rta_buf;
  1230. static int rtattr_max;
  1231. /* Process one rtnetlink message. */
  1232. static int rtnetlink_rcv_msg(struct sk_buff *skb, struct nlmsghdr *nlh)
  1233. {
  1234. struct net *net = sock_net(skb->sk);
  1235. rtnl_doit_func doit;
  1236. int sz_idx, kind;
  1237. int min_len;
  1238. int family;
  1239. int type;
  1240. int err;
  1241. type = nlh->nlmsg_type;
  1242. if (type > RTM_MAX)
  1243. return -EOPNOTSUPP;
  1244. type -= RTM_BASE;
  1245. /* All the messages must have at least 1 byte length */
  1246. if (nlh->nlmsg_len < NLMSG_LENGTH(sizeof(struct rtgenmsg)))
  1247. return 0;
  1248. family = ((struct rtgenmsg *)NLMSG_DATA(nlh))->rtgen_family;
  1249. if (family >= NPROTO)
  1250. return -EAFNOSUPPORT;
  1251. sz_idx = type>>2;
  1252. kind = type&3;
  1253. if (kind != 2 && security_netlink_recv(skb, CAP_NET_ADMIN))
  1254. return -EPERM;
  1255. if (kind == 2 && nlh->nlmsg_flags&NLM_F_DUMP) {
  1256. struct sock *rtnl;
  1257. rtnl_dumpit_func dumpit;
  1258. dumpit = rtnl_get_dumpit(family, type);
  1259. if (dumpit == NULL)
  1260. return -EOPNOTSUPP;
  1261. __rtnl_unlock();
  1262. rtnl = net->rtnl;
  1263. err = netlink_dump_start(rtnl, skb, nlh, dumpit, NULL);
  1264. rtnl_lock();
  1265. return err;
  1266. }
  1267. memset(rta_buf, 0, (rtattr_max * sizeof(struct rtattr *)));
  1268. min_len = rtm_min[sz_idx];
  1269. if (nlh->nlmsg_len < min_len)
  1270. return -EINVAL;
  1271. if (nlh->nlmsg_len > min_len) {
  1272. int attrlen = nlh->nlmsg_len - NLMSG_ALIGN(min_len);
  1273. struct rtattr *attr = (void *)nlh + NLMSG_ALIGN(min_len);
  1274. while (RTA_OK(attr, attrlen)) {
  1275. unsigned flavor = attr->rta_type;
  1276. if (flavor) {
  1277. if (flavor > rta_max[sz_idx])
  1278. return -EINVAL;
  1279. rta_buf[flavor-1] = attr;
  1280. }
  1281. attr = RTA_NEXT(attr, attrlen);
  1282. }
  1283. }
  1284. doit = rtnl_get_doit(family, type);
  1285. if (doit == NULL)
  1286. return -EOPNOTSUPP;
  1287. return doit(skb, nlh, (void *)&rta_buf[0]);
  1288. }
  1289. static void rtnetlink_rcv(struct sk_buff *skb)
  1290. {
  1291. rtnl_lock();
  1292. netlink_rcv_skb(skb, &rtnetlink_rcv_msg);
  1293. rtnl_unlock();
  1294. }
  1295. static int rtnetlink_event(struct notifier_block *this, unsigned long event, void *ptr)
  1296. {
  1297. struct net_device *dev = ptr;
  1298. switch (event) {
  1299. case NETDEV_UP:
  1300. case NETDEV_DOWN:
  1301. case NETDEV_PRE_UP:
  1302. case NETDEV_POST_INIT:
  1303. case NETDEV_REGISTER:
  1304. case NETDEV_CHANGE:
  1305. case NETDEV_GOING_DOWN:
  1306. case NETDEV_UNREGISTER:
  1307. case NETDEV_UNREGISTER_BATCH:
  1308. break;
  1309. default:
  1310. rtmsg_ifinfo(RTM_NEWLINK, dev, 0);
  1311. break;
  1312. }
  1313. return NOTIFY_DONE;
  1314. }
  1315. static struct notifier_block rtnetlink_dev_notifier = {
  1316. .notifier_call = rtnetlink_event,
  1317. };
  1318. static int __net_init rtnetlink_net_init(struct net *net)
  1319. {
  1320. struct sock *sk;
  1321. sk = netlink_kernel_create(net, NETLINK_ROUTE, RTNLGRP_MAX,
  1322. rtnetlink_rcv, &rtnl_mutex, THIS_MODULE);
  1323. if (!sk)
  1324. return -ENOMEM;
  1325. net->rtnl = sk;
  1326. return 0;
  1327. }
  1328. static void __net_exit rtnetlink_net_exit(struct net *net)
  1329. {
  1330. netlink_kernel_release(net->rtnl);
  1331. net->rtnl = NULL;
  1332. }
  1333. static struct pernet_operations rtnetlink_net_ops = {
  1334. .init = rtnetlink_net_init,
  1335. .exit = rtnetlink_net_exit,
  1336. };
  1337. void __init rtnetlink_init(void)
  1338. {
  1339. int i;
  1340. rtattr_max = 0;
  1341. for (i = 0; i < ARRAY_SIZE(rta_max); i++)
  1342. if (rta_max[i] > rtattr_max)
  1343. rtattr_max = rta_max[i];
  1344. rta_buf = kmalloc(rtattr_max * sizeof(struct rtattr *), GFP_KERNEL);
  1345. if (!rta_buf)
  1346. panic("rtnetlink_init: cannot allocate rta_buf\n");
  1347. if (register_pernet_subsys(&rtnetlink_net_ops))
  1348. panic("rtnetlink_init: cannot initialize rtnetlink\n");
  1349. netlink_set_nonroot(NETLINK_ROUTE, NL_NONROOT_RECV);
  1350. register_netdevice_notifier(&rtnetlink_dev_notifier);
  1351. rtnl_register(PF_UNSPEC, RTM_GETLINK, rtnl_getlink, rtnl_dump_ifinfo);
  1352. rtnl_register(PF_UNSPEC, RTM_SETLINK, rtnl_setlink, NULL);
  1353. rtnl_register(PF_UNSPEC, RTM_NEWLINK, rtnl_newlink, NULL);
  1354. rtnl_register(PF_UNSPEC, RTM_DELLINK, rtnl_dellink, NULL);
  1355. rtnl_register(PF_UNSPEC, RTM_GETADDR, NULL, rtnl_dump_all);
  1356. rtnl_register(PF_UNSPEC, RTM_GETROUTE, NULL, rtnl_dump_all);
  1357. }