gre_demux.c 8.5 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385
  1. /*
  2. * GRE over IPv4 demultiplexer driver
  3. *
  4. * Authors: Dmitry Kozlov (xeb@mail.ru)
  5. *
  6. * This program is free software; you can redistribute it and/or
  7. * modify it under the terms of the GNU General Public License
  8. * as published by the Free Software Foundation; either version
  9. * 2 of the License, or (at your option) any later version.
  10. *
  11. */
  12. #define pr_fmt(fmt) KBUILD_MODNAME ": " fmt
  13. #include <linux/module.h>
  14. #include <linux/if.h>
  15. #include <linux/icmp.h>
  16. #include <linux/kernel.h>
  17. #include <linux/kmod.h>
  18. #include <linux/skbuff.h>
  19. #include <linux/in.h>
  20. #include <linux/ip.h>
  21. #include <linux/netdevice.h>
  22. #include <linux/if_tunnel.h>
  23. #include <linux/spinlock.h>
  24. #include <net/protocol.h>
  25. #include <net/gre.h>
  26. #include <net/icmp.h>
  27. #include <net/route.h>
  28. #include <net/xfrm.h>
  29. static const struct gre_protocol __rcu *gre_proto[GREPROTO_MAX] __read_mostly;
  30. static struct gre_cisco_protocol __rcu *gre_cisco_proto_list[GRE_IP_PROTO_MAX];
  31. int gre_add_protocol(const struct gre_protocol *proto, u8 version)
  32. {
  33. if (version >= GREPROTO_MAX)
  34. return -EINVAL;
  35. return (cmpxchg((const struct gre_protocol **)&gre_proto[version], NULL, proto) == NULL) ?
  36. 0 : -EBUSY;
  37. }
  38. EXPORT_SYMBOL_GPL(gre_add_protocol);
  39. int gre_del_protocol(const struct gre_protocol *proto, u8 version)
  40. {
  41. int ret;
  42. if (version >= GREPROTO_MAX)
  43. return -EINVAL;
  44. ret = (cmpxchg((const struct gre_protocol **)&gre_proto[version], proto, NULL) == proto) ?
  45. 0 : -EBUSY;
  46. if (ret)
  47. return ret;
  48. synchronize_rcu();
  49. return 0;
  50. }
  51. EXPORT_SYMBOL_GPL(gre_del_protocol);
  52. void gre_build_header(struct sk_buff *skb, const struct tnl_ptk_info *tpi,
  53. int hdr_len)
  54. {
  55. struct gre_base_hdr *greh;
  56. skb_push(skb, hdr_len);
  57. greh = (struct gre_base_hdr *)skb->data;
  58. greh->flags = tnl_flags_to_gre_flags(tpi->flags);
  59. greh->protocol = tpi->proto;
  60. if (tpi->flags&(TUNNEL_KEY|TUNNEL_CSUM|TUNNEL_SEQ)) {
  61. __be32 *ptr = (__be32 *)(((u8 *)greh) + hdr_len - 4);
  62. if (tpi->flags&TUNNEL_SEQ) {
  63. *ptr = tpi->seq;
  64. ptr--;
  65. }
  66. if (tpi->flags&TUNNEL_KEY) {
  67. *ptr = tpi->key;
  68. ptr--;
  69. }
  70. if (tpi->flags&TUNNEL_CSUM &&
  71. !(skb_shinfo(skb)->gso_type & SKB_GSO_GRE)) {
  72. *ptr = 0;
  73. *(__sum16 *)ptr = csum_fold(skb_checksum(skb, 0,
  74. skb->len, 0));
  75. }
  76. }
  77. }
  78. EXPORT_SYMBOL_GPL(gre_build_header);
  79. static __sum16 check_checksum(struct sk_buff *skb)
  80. {
  81. __sum16 csum = 0;
  82. switch (skb->ip_summed) {
  83. case CHECKSUM_COMPLETE:
  84. csum = csum_fold(skb->csum);
  85. if (!csum)
  86. break;
  87. /* Fall through. */
  88. case CHECKSUM_NONE:
  89. skb->csum = 0;
  90. csum = __skb_checksum_complete(skb);
  91. skb->ip_summed = CHECKSUM_COMPLETE;
  92. break;
  93. }
  94. return csum;
  95. }
  96. static int parse_gre_header(struct sk_buff *skb, struct tnl_ptk_info *tpi,
  97. bool *csum_err)
  98. {
  99. unsigned int ip_hlen = ip_hdrlen(skb);
  100. const struct gre_base_hdr *greh;
  101. __be32 *options;
  102. int hdr_len;
  103. if (unlikely(!pskb_may_pull(skb, sizeof(struct gre_base_hdr))))
  104. return -EINVAL;
  105. greh = (struct gre_base_hdr *)(skb_network_header(skb) + ip_hlen);
  106. if (unlikely(greh->flags & (GRE_VERSION | GRE_ROUTING)))
  107. return -EINVAL;
  108. tpi->flags = gre_flags_to_tnl_flags(greh->flags);
  109. hdr_len = ip_gre_calc_hlen(tpi->flags);
  110. if (!pskb_may_pull(skb, hdr_len))
  111. return -EINVAL;
  112. greh = (struct gre_base_hdr *)(skb_network_header(skb) + ip_hlen);
  113. tpi->proto = greh->protocol;
  114. options = (__be32 *)(greh + 1);
  115. if (greh->flags & GRE_CSUM) {
  116. if (check_checksum(skb)) {
  117. *csum_err = true;
  118. return -EINVAL;
  119. }
  120. options++;
  121. }
  122. if (greh->flags & GRE_KEY) {
  123. tpi->key = *options;
  124. options++;
  125. } else
  126. tpi->key = 0;
  127. if (unlikely(greh->flags & GRE_SEQ)) {
  128. tpi->seq = *options;
  129. options++;
  130. } else
  131. tpi->seq = 0;
  132. /* WCCP version 1 and 2 protocol decoding.
  133. * - Change protocol to IP
  134. * - When dealing with WCCPv2, Skip extra 4 bytes in GRE header
  135. */
  136. if (greh->flags == 0 && tpi->proto == htons(ETH_P_WCCP)) {
  137. tpi->proto = htons(ETH_P_IP);
  138. if ((*(u8 *)options & 0xF0) != 0x40) {
  139. hdr_len += 4;
  140. if (!pskb_may_pull(skb, hdr_len))
  141. return -EINVAL;
  142. }
  143. }
  144. return iptunnel_pull_header(skb, hdr_len, tpi->proto);
  145. }
  146. static int gre_cisco_rcv(struct sk_buff *skb)
  147. {
  148. struct tnl_ptk_info tpi;
  149. int i;
  150. bool csum_err = false;
  151. if (parse_gre_header(skb, &tpi, &csum_err) < 0)
  152. goto drop;
  153. rcu_read_lock();
  154. for (i = 0; i < GRE_IP_PROTO_MAX; i++) {
  155. struct gre_cisco_protocol *proto;
  156. int ret;
  157. proto = rcu_dereference(gre_cisco_proto_list[i]);
  158. if (!proto)
  159. continue;
  160. ret = proto->handler(skb, &tpi);
  161. if (ret == PACKET_RCVD) {
  162. rcu_read_unlock();
  163. return 0;
  164. }
  165. }
  166. rcu_read_unlock();
  167. icmp_send(skb, ICMP_DEST_UNREACH, ICMP_PORT_UNREACH, 0);
  168. drop:
  169. kfree_skb(skb);
  170. return 0;
  171. }
  172. static void gre_cisco_err(struct sk_buff *skb, u32 info)
  173. {
  174. /* All the routers (except for Linux) return only
  175. * 8 bytes of packet payload. It means, that precise relaying of
  176. * ICMP in the real Internet is absolutely infeasible.
  177. *
  178. * Moreover, Cisco "wise men" put GRE key to the third word
  179. * in GRE header. It makes impossible maintaining even soft
  180. * state for keyed
  181. * GRE tunnels with enabled checksum. Tell them "thank you".
  182. *
  183. * Well, I wonder, rfc1812 was written by Cisco employee,
  184. * what the hell these idiots break standards established
  185. * by themselves???
  186. */
  187. const int type = icmp_hdr(skb)->type;
  188. const int code = icmp_hdr(skb)->code;
  189. struct tnl_ptk_info tpi;
  190. bool csum_err = false;
  191. int i;
  192. if (parse_gre_header(skb, &tpi, &csum_err)) {
  193. if (!csum_err) /* ignore csum errors. */
  194. return;
  195. }
  196. if (type == ICMP_DEST_UNREACH && code == ICMP_FRAG_NEEDED) {
  197. ipv4_update_pmtu(skb, dev_net(skb->dev), info,
  198. skb->dev->ifindex, 0, IPPROTO_GRE, 0);
  199. return;
  200. }
  201. if (type == ICMP_REDIRECT) {
  202. ipv4_redirect(skb, dev_net(skb->dev), skb->dev->ifindex, 0,
  203. IPPROTO_GRE, 0);
  204. return;
  205. }
  206. rcu_read_lock();
  207. for (i = 0; i < GRE_IP_PROTO_MAX; i++) {
  208. struct gre_cisco_protocol *proto;
  209. proto = rcu_dereference(gre_cisco_proto_list[i]);
  210. if (!proto)
  211. continue;
  212. if (proto->err_handler(skb, info, &tpi) == PACKET_RCVD)
  213. goto out;
  214. }
  215. out:
  216. rcu_read_unlock();
  217. }
  218. static int gre_rcv(struct sk_buff *skb)
  219. {
  220. const struct gre_protocol *proto;
  221. u8 ver;
  222. int ret;
  223. if (!pskb_may_pull(skb, 12))
  224. goto drop;
  225. ver = skb->data[1]&0x7f;
  226. if (ver >= GREPROTO_MAX)
  227. goto drop;
  228. rcu_read_lock();
  229. proto = rcu_dereference(gre_proto[ver]);
  230. if (!proto || !proto->handler)
  231. goto drop_unlock;
  232. ret = proto->handler(skb);
  233. rcu_read_unlock();
  234. return ret;
  235. drop_unlock:
  236. rcu_read_unlock();
  237. drop:
  238. kfree_skb(skb);
  239. return NET_RX_DROP;
  240. }
  241. static void gre_err(struct sk_buff *skb, u32 info)
  242. {
  243. const struct gre_protocol *proto;
  244. const struct iphdr *iph = (const struct iphdr *)skb->data;
  245. u8 ver = skb->data[(iph->ihl<<2) + 1]&0x7f;
  246. if (ver >= GREPROTO_MAX)
  247. return;
  248. rcu_read_lock();
  249. proto = rcu_dereference(gre_proto[ver]);
  250. if (proto && proto->err_handler)
  251. proto->err_handler(skb, info);
  252. rcu_read_unlock();
  253. }
  254. static const struct net_protocol net_gre_protocol = {
  255. .handler = gre_rcv,
  256. .err_handler = gre_err,
  257. .netns_ok = 1,
  258. };
  259. static const struct gre_protocol ipgre_protocol = {
  260. .handler = gre_cisco_rcv,
  261. .err_handler = gre_cisco_err,
  262. };
  263. int gre_cisco_register(struct gre_cisco_protocol *newp)
  264. {
  265. struct gre_cisco_protocol **proto = (struct gre_cisco_protocol **)
  266. &gre_cisco_proto_list[newp->priority];
  267. return (cmpxchg(proto, NULL, newp) == NULL) ? 0 : -EBUSY;
  268. }
  269. EXPORT_SYMBOL_GPL(gre_cisco_register);
  270. int gre_cisco_unregister(struct gre_cisco_protocol *del_proto)
  271. {
  272. struct gre_cisco_protocol **proto = (struct gre_cisco_protocol **)
  273. &gre_cisco_proto_list[del_proto->priority];
  274. int ret;
  275. ret = (cmpxchg(proto, del_proto, NULL) == del_proto) ? 0 : -EINVAL;
  276. if (ret)
  277. return ret;
  278. synchronize_net();
  279. return 0;
  280. }
  281. EXPORT_SYMBOL_GPL(gre_cisco_unregister);
  282. static int __init gre_init(void)
  283. {
  284. pr_info("GRE over IPv4 demultiplexor driver\n");
  285. if (inet_add_protocol(&net_gre_protocol, IPPROTO_GRE) < 0) {
  286. pr_err("can't add protocol\n");
  287. goto err;
  288. }
  289. if (gre_add_protocol(&ipgre_protocol, GREPROTO_CISCO) < 0) {
  290. pr_info("%s: can't add ipgre handler\n", __func__);
  291. goto err_gre;
  292. }
  293. if (gre_offload_init()) {
  294. pr_err("can't add protocol offload\n");
  295. goto err_gso;
  296. }
  297. return 0;
  298. err_gso:
  299. gre_del_protocol(&ipgre_protocol, GREPROTO_CISCO);
  300. err_gre:
  301. inet_del_protocol(&net_gre_protocol, IPPROTO_GRE);
  302. err:
  303. return -EAGAIN;
  304. }
  305. static void __exit gre_exit(void)
  306. {
  307. gre_offload_exit();
  308. gre_del_protocol(&ipgre_protocol, GREPROTO_CISCO);
  309. inet_del_protocol(&net_gre_protocol, IPPROTO_GRE);
  310. }
  311. module_init(gre_init);
  312. module_exit(gre_exit);
  313. MODULE_DESCRIPTION("GRE over IPv4 demultiplexer driver");
  314. MODULE_AUTHOR("D. Kozlov (xeb@mail.ru)");
  315. MODULE_LICENSE("GPL");