xfrm4_policy.c 8.1 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356
  1. /*
  2. * xfrm4_policy.c
  3. *
  4. * Changes:
  5. * Kazunori MIYAZAWA @USAGI
  6. * YOSHIFUJI Hideaki @USAGI
  7. * Split up af-specific portion
  8. *
  9. */
  10. #include <linux/compiler.h>
  11. #include <linux/inetdevice.h>
  12. #include <net/dst.h>
  13. #include <net/xfrm.h>
  14. #include <net/ip.h>
/*
 * Forward declarations.  Both objects are defined with their initializers
 * near the end of this file, but they are referenced by functions that
 * appear before those definitions.
 */
static struct dst_ops xfrm4_dst_ops;
static struct xfrm_policy_afinfo xfrm4_policy_afinfo;
  17. static int xfrm4_dst_lookup(struct xfrm_dst **dst, struct flowi *fl)
  18. {
  19. return __ip_route_output_key((struct rtable**)dst, fl);
  20. }
  21. static int xfrm4_get_saddr(xfrm_address_t *saddr, xfrm_address_t *daddr)
  22. {
  23. struct rtable *rt;
  24. struct flowi fl_tunnel = {
  25. .nl_u = {
  26. .ip4_u = {
  27. .daddr = daddr->a4,
  28. },
  29. },
  30. };
  31. if (!xfrm4_dst_lookup((struct xfrm_dst **)&rt, &fl_tunnel)) {
  32. saddr->a4 = rt->rt_src;
  33. dst_release(&rt->u.dst);
  34. return 0;
  35. }
  36. return -EHOSTUNREACH;
  37. }
  38. static struct dst_entry *
  39. __xfrm4_find_bundle(struct flowi *fl, struct xfrm_policy *policy)
  40. {
  41. struct dst_entry *dst;
  42. read_lock_bh(&policy->lock);
  43. for (dst = policy->bundles; dst; dst = dst->next) {
  44. struct xfrm_dst *xdst = (struct xfrm_dst*)dst;
  45. if (xdst->u.rt.fl.oif == fl->oif && /*XXX*/
  46. xdst->u.rt.fl.fl4_dst == fl->fl4_dst &&
  47. xdst->u.rt.fl.fl4_src == fl->fl4_src &&
  48. xdst->u.rt.fl.fl4_tos == fl->fl4_tos &&
  49. xfrm_bundle_ok(policy, xdst, fl, AF_INET, 0)) {
  50. dst_clone(dst);
  51. break;
  52. }
  53. }
  54. read_unlock_bh(&policy->lock);
  55. return dst;
  56. }
/* Allocate chain of dst_entry's, attach known xfrm's, calculate
 * all the metrics... Shortly, bundle a bundle.
 *
 * @policy: not referenced in this function body.
 * @xfrm:   array of @nx states; one dst entry is allocated per state.
 * @nx:     number of entries in @xfrm.
 * @fl:     flow the bundle is built for; copied into every new entry.
 * @dst_p:  on entry, the route the bundle starts from; on success it is
 *          overwritten with the first entry of the new chain.
 *
 * Returns 0 on success.  On failure returns -ENOBUFS when dst_alloc()
 * fails, the error from xfrm_dst_lookup() when re-routing fails, or
 * -ENODEV when the final route has no device or in_dev_get() returns NULL.
 */
static int
__xfrm4_bundle_create(struct xfrm_policy *policy, struct xfrm_state **xfrm, int nx,
		      struct flowi *fl, struct dst_entry **dst_p)
{
	struct dst_entry *dst, *dst_prev;
	/* rt0 stays on the route passed in; rt is replaced on every re-route. */
	struct rtable *rt0 = (struct rtable*)(*dst_p);
	struct rtable *rt = rt0;
	/* Flow used for re-routing; seeded from the caller's flow. */
	struct flowi fl_tunnel = {
		.nl_u = {
			.ip4_u = {
				.saddr = fl->fl4_src,
				.daddr = fl->fl4_dst,
				.tos = fl->fl4_tos
			}
		}
	};
	int i;
	int err;
	int header_len = 0;
	int trailer_len = 0;

	dst = dst_prev = NULL;
	dst_hold(&rt->u.dst);

	/* Pass 1: allocate one entry per state and link them together. */
	for (i = 0; i < nx; i++) {
		struct dst_entry *dst1 = dst_alloc(&xfrm4_dst_ops);
		struct xfrm_dst *xdst;

		if (unlikely(dst1 == NULL)) {
			err = -ENOBUFS;
			dst_release(&rt->u.dst);
			goto error;
		}

		/* The first allocation becomes the head; later ones are
		 * chained as the child of the previous entry. */
		if (!dst)
			dst = dst1;
		else {
			dst_prev->child = dst1;
			dst1->flags |= DST_NOHASH;
			dst_clone(dst1);
		}

		xdst = (struct xfrm_dst *)dst1;
		xdst->route = &rt->u.dst;
		xdst->genid = xfrm[i]->genid;

		/* ->next points back at the previously allocated entry. */
		dst1->next = dst_prev;
		dst_prev = dst1;

		/* Running totals over all states; consumed in pass 2. */
		header_len += xfrm[i]->props.header_len;
		trailer_len += xfrm[i]->props.trailer_len;

		if (xfrm[i]->props.mode != XFRM_MODE_TRANSPORT) {
			/* Non-transport mode: re-route using the state's own
			 * endpoint addresses, in the state's address family. */
			unsigned short encap_family = xfrm[i]->props.family;
			switch (encap_family) {
			case AF_INET:
				fl_tunnel.fl4_dst = xfrm[i]->id.daddr.a4;
				fl_tunnel.fl4_src = xfrm[i]->props.saddr.a4;
				break;
#if defined(CONFIG_IPV6) || defined (CONFIG_IPV6_MODULE)
			case AF_INET6:
				ipv6_addr_copy(&fl_tunnel.fl6_dst, (struct in6_addr*)&xfrm[i]->id.daddr.a6);
				ipv6_addr_copy(&fl_tunnel.fl6_src, (struct in6_addr*)&xfrm[i]->props.saddr.a6);
				break;
#endif
			default:
				/* Any other family is treated as a bug. */
				BUG_ON(1);
			}
			/* rt is overwritten with the result of the lookup. */
			err = xfrm_dst_lookup((struct xfrm_dst **)&rt,
					      &fl_tunnel, encap_family);
			if (err)
				goto error;
		} else
			/* Transport mode keeps the current route; take
			 * another hold on it. */
			dst_hold(&rt->u.dst);
	}

	/* Terminate the chain with the final route. */
	dst_prev->child = &rt->u.dst;
	dst->path = &rt->u.dst;

	/* Copy neighbour for reachability confirmation */
	dst->neighbour = neigh_clone(rt->u.dst.neighbour);

	*dst_p = dst;
	/* From here on 'dst' is the last allocated entry and 'dst_prev'
	 * walks the chain from its head.
	 * NOTE(review): the error label below therefore calls dst_free() on
	 * the last allocated entry rather than on the head - confirm this is
	 * intended. */
	dst = dst_prev;

	dst_prev = *dst_p;
	i = 0;
	err = -ENODEV;
	/* Pass 2: fill in every allocated entry, head first, stopping when
	 * the walk reaches the final route. */
	for (; dst_prev != &rt->u.dst; dst_prev = dst_prev->child) {
		struct xfrm_dst *x = (struct xfrm_dst*)dst_prev;
		x->u.rt.fl = *fl;

		dst_prev->xfrm = xfrm[i++];
		dst_prev->dev = rt->u.dst.dev;
		if (!rt->u.dst.dev)
			goto error;
		dev_hold(rt->u.dst.dev);

		x->u.rt.idev = in_dev_get(rt->u.dst.dev);
		if (!x->u.rt.idev)
			goto error;

		dst_prev->obsolete = -1;
		dst_prev->flags |= DST_HOST;
		dst_prev->lastuse = jiffies;
		/* Each entry records the totals that still include its own
		 * state; its share is subtracted at the bottom of the loop. */
		dst_prev->header_len = header_len;
		dst_prev->trailer_len = trailer_len;
		memcpy(&dst_prev->metrics, &x->route->metrics, sizeof(dst_prev->metrics));

		dst_prev->input = dst_discard;
		dst_prev->output = dst_prev->xfrm->outer_mode->afinfo->output;
		/* Share the original route's peer, bumping its refcount. */
		if (rt0->peer)
			atomic_inc(&rt0->peer->refcnt);
		x->u.rt.peer = rt0->peer;
		/* Sheit... I remember I did this right. Apparently,
		 * it was magically lost, so this code needs audit */
		x->u.rt.rt_flags = rt0->rt_flags&(RTCF_BROADCAST|RTCF_MULTICAST|RTCF_LOCAL);
		x->u.rt.rt_type = rt0->rt_type;
		x->u.rt.rt_src = rt0->rt_src;
		x->u.rt.rt_dst = rt0->rt_dst;
		x->u.rt.rt_gateway = rt0->rt_gateway;
		x->u.rt.rt_spec_dst = rt0->rt_spec_dst;
		header_len -= x->u.dst.xfrm->props.header_len;
		trailer_len -= x->u.dst.xfrm->props.trailer_len;
	}

	xfrm_init_pmtu(dst);
	return 0;

error:
	if (dst)
		dst_free(dst);
	return err;
}
  176. static void
  177. _decode_session4(struct sk_buff *skb, struct flowi *fl)
  178. {
  179. struct iphdr *iph = ip_hdr(skb);
  180. u8 *xprth = skb_network_header(skb) + iph->ihl * 4;
  181. memset(fl, 0, sizeof(struct flowi));
  182. if (!(iph->frag_off & htons(IP_MF | IP_OFFSET))) {
  183. switch (iph->protocol) {
  184. case IPPROTO_UDP:
  185. case IPPROTO_UDPLITE:
  186. case IPPROTO_TCP:
  187. case IPPROTO_SCTP:
  188. case IPPROTO_DCCP:
  189. if (pskb_may_pull(skb, xprth + 4 - skb->data)) {
  190. __be16 *ports = (__be16 *)xprth;
  191. fl->fl_ip_sport = ports[0];
  192. fl->fl_ip_dport = ports[1];
  193. }
  194. break;
  195. case IPPROTO_ICMP:
  196. if (pskb_may_pull(skb, xprth + 2 - skb->data)) {
  197. u8 *icmp = xprth;
  198. fl->fl_icmp_type = icmp[0];
  199. fl->fl_icmp_code = icmp[1];
  200. }
  201. break;
  202. case IPPROTO_ESP:
  203. if (pskb_may_pull(skb, xprth + 4 - skb->data)) {
  204. __be32 *ehdr = (__be32 *)xprth;
  205. fl->fl_ipsec_spi = ehdr[0];
  206. }
  207. break;
  208. case IPPROTO_AH:
  209. if (pskb_may_pull(skb, xprth + 8 - skb->data)) {
  210. __be32 *ah_hdr = (__be32*)xprth;
  211. fl->fl_ipsec_spi = ah_hdr[1];
  212. }
  213. break;
  214. case IPPROTO_COMP:
  215. if (pskb_may_pull(skb, xprth + 4 - skb->data)) {
  216. __be16 *ipcomp_hdr = (__be16 *)xprth;
  217. fl->fl_ipsec_spi = htonl(ntohs(ipcomp_hdr[1]));
  218. }
  219. break;
  220. default:
  221. fl->fl_ipsec_spi = 0;
  222. break;
  223. }
  224. }
  225. fl->proto = iph->protocol;
  226. fl->fl4_dst = iph->daddr;
  227. fl->fl4_src = iph->saddr;
  228. fl->fl4_tos = iph->tos;
  229. }
  230. static inline int xfrm4_garbage_collect(void)
  231. {
  232. xfrm4_policy_afinfo.garbage_collect();
  233. return (atomic_read(&xfrm4_dst_ops.entries) > xfrm4_dst_ops.gc_thresh*2);
  234. }
  235. static void xfrm4_update_pmtu(struct dst_entry *dst, u32 mtu)
  236. {
  237. struct xfrm_dst *xdst = (struct xfrm_dst *)dst;
  238. struct dst_entry *path = xdst->route;
  239. path->ops->update_pmtu(path, mtu);
  240. }
  241. static void xfrm4_dst_destroy(struct dst_entry *dst)
  242. {
  243. struct xfrm_dst *xdst = (struct xfrm_dst *)dst;
  244. if (likely(xdst->u.rt.idev))
  245. in_dev_put(xdst->u.rt.idev);
  246. if (likely(xdst->u.rt.peer))
  247. inet_putpeer(xdst->u.rt.peer);
  248. xfrm_dst_destroy(xdst);
  249. }
  250. static void xfrm4_dst_ifdown(struct dst_entry *dst, struct net_device *dev,
  251. int unregister)
  252. {
  253. struct xfrm_dst *xdst;
  254. if (!unregister)
  255. return;
  256. xdst = (struct xfrm_dst *)dst;
  257. if (xdst->u.rt.idev->dev == dev) {
  258. struct in_device *loopback_idev = in_dev_get(init_net.loopback_dev);
  259. BUG_ON(!loopback_idev);
  260. do {
  261. in_dev_put(xdst->u.rt.idev);
  262. xdst->u.rt.idev = loopback_idev;
  263. in_dev_hold(loopback_idev);
  264. xdst = (struct xfrm_dst *)xdst->u.dst.child;
  265. } while (xdst->u.dst.xfrm);
  266. __in_dev_put(loopback_idev);
  267. }
  268. xfrm_dst_ifdown(dst, dev);
  269. }
/*
 * dst_ops for the IPv4 xfrm dst entries.  This is the object passed to
 * dst_alloc() in __xfrm4_bundle_create(); the callbacks are the static
 * functions defined above in this file.
 */
static struct dst_ops xfrm4_dst_ops = {
	.family = AF_INET,
	.protocol = __constant_htons(ETH_P_IP),
	.gc = xfrm4_garbage_collect,
	.update_pmtu = xfrm4_update_pmtu,
	.destroy = xfrm4_dst_destroy,
	.ifdown = xfrm4_dst_ifdown,
	/* xfrm4_garbage_collect() compares the entry count to twice this. */
	.gc_thresh = 1024,
	/* Entries are allocated as struct xfrm_dst, not bare dst_entry. */
	.entry_size = sizeof(struct xfrm_dst),
};
/*
 * IPv4 policy operations table.  It is handed to
 * xfrm_policy_register_afinfo() in xfrm4_policy_init() and wires the
 * AF_INET helpers defined in this file into struct xfrm_policy_afinfo.
 * The garbage_collect member called by xfrm4_garbage_collect() is not
 * initialized here.
 */
static struct xfrm_policy_afinfo xfrm4_policy_afinfo = {
	.family = AF_INET,
	.dst_ops = &xfrm4_dst_ops,
	.dst_lookup = xfrm4_dst_lookup,
	.get_saddr = xfrm4_get_saddr,
	.find_bundle = __xfrm4_find_bundle,
	.bundle_create = __xfrm4_bundle_create,
	.decode_session = _decode_session4,
};
  289. static void __init xfrm4_policy_init(void)
  290. {
  291. xfrm_policy_register_afinfo(&xfrm4_policy_afinfo);
  292. }
  293. static void __exit xfrm4_policy_fini(void)
  294. {
  295. xfrm_policy_unregister_afinfo(&xfrm4_policy_afinfo);
  296. }
  297. void __init xfrm4_init(void)
  298. {
  299. xfrm4_state_init();
  300. xfrm4_policy_init();
  301. }