ip_options.c 15 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634635636637638639640641642643644645646647
  1. /*
  2. * INET An implementation of the TCP/IP protocol suite for the LINUX
  3. * operating system. INET is implemented using the BSD Socket
  4. * interface as the means of communication with the user level.
  5. *
  6. * The options processing module for ip.c
  7. *
  8. * Authors: A.N.Kuznetsov
  9. *
  10. */
  11. #include <linux/capability.h>
  12. #include <linux/module.h>
  13. #include <linux/types.h>
  14. #include <asm/uaccess.h>
  15. #include <linux/skbuff.h>
  16. #include <linux/ip.h>
  17. #include <linux/icmp.h>
  18. #include <linux/netdevice.h>
  19. #include <linux/rtnetlink.h>
  20. #include <net/sock.h>
  21. #include <net/ip.h>
  22. #include <net/icmp.h>
  23. #include <net/route.h>
  24. #include <net/cipso_ipv4.h>
  25. /*
  26. * Write options to IP header, record destination address to
  27. * source route option, address of outgoing interface
  28. * (we should already know it, so that this function is allowed be
  29. * called only after routing decision) and timestamp,
  30. * if we originate this datagram.
  31. *
  32. * daddr is real destination address, next hop is recorded in IP header.
  33. * saddr is address of outgoing interface.
  34. */
  35. void ip_options_build(struct sk_buff * skb, struct ip_options * opt,
  36. __be32 daddr, struct rtable *rt, int is_frag)
  37. {
  38. unsigned char *iph = skb_network_header(skb);
  39. memcpy(&(IPCB(skb)->opt), opt, sizeof(struct ip_options));
  40. memcpy(iph+sizeof(struct iphdr), opt->__data, opt->optlen);
  41. opt = &(IPCB(skb)->opt);
  42. if (opt->srr)
  43. memcpy(iph+opt->srr+iph[opt->srr+1]-4, &daddr, 4);
  44. if (!is_frag) {
  45. if (opt->rr_needaddr)
  46. ip_rt_get_source(iph+opt->rr+iph[opt->rr+2]-5, rt);
  47. if (opt->ts_needaddr)
  48. ip_rt_get_source(iph+opt->ts+iph[opt->ts+2]-9, rt);
  49. if (opt->ts_needtime) {
  50. struct timespec tv;
  51. __be32 midtime;
  52. getnstimeofday(&tv);
  53. midtime = htonl((tv.tv_sec % 86400) * MSEC_PER_SEC + tv.tv_nsec / NSEC_PER_MSEC);
  54. memcpy(iph+opt->ts+iph[opt->ts+2]-5, &midtime, 4);
  55. }
  56. return;
  57. }
  58. if (opt->rr) {
  59. memset(iph+opt->rr, IPOPT_NOP, iph[opt->rr+1]);
  60. opt->rr = 0;
  61. opt->rr_needaddr = 0;
  62. }
  63. if (opt->ts) {
  64. memset(iph+opt->ts, IPOPT_NOP, iph[opt->ts+1]);
  65. opt->ts = 0;
  66. opt->ts_needaddr = opt->ts_needtime = 0;
  67. }
  68. }
  69. /*
  70. * Provided (sopt, skb) points to received options,
  71. * build in dopt compiled option set appropriate for answering.
  72. * i.e. invert SRR option, copy anothers,
  73. * and grab room in RR/TS options.
  74. *
  75. * NOTE: dopt cannot point to skb.
  76. */
  77. int ip_options_echo(struct ip_options * dopt, struct sk_buff * skb)
  78. {
  79. struct ip_options *sopt;
  80. unsigned char *sptr, *dptr;
  81. int soffset, doffset;
  82. int optlen;
  83. __be32 daddr;
  84. memset(dopt, 0, sizeof(struct ip_options));
  85. sopt = &(IPCB(skb)->opt);
  86. if (sopt->optlen == 0) {
  87. dopt->optlen = 0;
  88. return 0;
  89. }
  90. sptr = skb_network_header(skb);
  91. dptr = dopt->__data;
  92. daddr = skb->rtable->rt_spec_dst;
  93. if (sopt->rr) {
  94. optlen = sptr[sopt->rr+1];
  95. soffset = sptr[sopt->rr+2];
  96. dopt->rr = dopt->optlen + sizeof(struct iphdr);
  97. memcpy(dptr, sptr+sopt->rr, optlen);
  98. if (sopt->rr_needaddr && soffset <= optlen) {
  99. if (soffset + 3 > optlen)
  100. return -EINVAL;
  101. dptr[2] = soffset + 4;
  102. dopt->rr_needaddr = 1;
  103. }
  104. dptr += optlen;
  105. dopt->optlen += optlen;
  106. }
  107. if (sopt->ts) {
  108. optlen = sptr[sopt->ts+1];
  109. soffset = sptr[sopt->ts+2];
  110. dopt->ts = dopt->optlen + sizeof(struct iphdr);
  111. memcpy(dptr, sptr+sopt->ts, optlen);
  112. if (soffset <= optlen) {
  113. if (sopt->ts_needaddr) {
  114. if (soffset + 3 > optlen)
  115. return -EINVAL;
  116. dopt->ts_needaddr = 1;
  117. soffset += 4;
  118. }
  119. if (sopt->ts_needtime) {
  120. if (soffset + 3 > optlen)
  121. return -EINVAL;
  122. if ((dptr[3]&0xF) != IPOPT_TS_PRESPEC) {
  123. dopt->ts_needtime = 1;
  124. soffset += 4;
  125. } else {
  126. dopt->ts_needtime = 0;
  127. if (soffset + 8 <= optlen) {
  128. __be32 addr;
  129. memcpy(&addr, sptr+soffset-1, 4);
  130. if (inet_addr_type(dev_net(skb->dst->dev), addr) != RTN_LOCAL) {
  131. dopt->ts_needtime = 1;
  132. soffset += 8;
  133. }
  134. }
  135. }
  136. }
  137. dptr[2] = soffset;
  138. }
  139. dptr += optlen;
  140. dopt->optlen += optlen;
  141. }
  142. if (sopt->srr) {
  143. unsigned char * start = sptr+sopt->srr;
  144. __be32 faddr;
  145. optlen = start[1];
  146. soffset = start[2];
  147. doffset = 0;
  148. if (soffset > optlen)
  149. soffset = optlen + 1;
  150. soffset -= 4;
  151. if (soffset > 3) {
  152. memcpy(&faddr, &start[soffset-1], 4);
  153. for (soffset-=4, doffset=4; soffset > 3; soffset-=4, doffset+=4)
  154. memcpy(&dptr[doffset-1], &start[soffset-1], 4);
  155. /*
  156. * RFC1812 requires to fix illegal source routes.
  157. */
  158. if (memcmp(&ip_hdr(skb)->saddr,
  159. &start[soffset + 3], 4) == 0)
  160. doffset -= 4;
  161. }
  162. if (doffset > 3) {
  163. memcpy(&start[doffset-1], &daddr, 4);
  164. dopt->faddr = faddr;
  165. dptr[0] = start[0];
  166. dptr[1] = doffset+3;
  167. dptr[2] = 4;
  168. dptr += doffset+3;
  169. dopt->srr = dopt->optlen + sizeof(struct iphdr);
  170. dopt->optlen += doffset+3;
  171. dopt->is_strictroute = sopt->is_strictroute;
  172. }
  173. }
  174. if (sopt->cipso) {
  175. optlen = sptr[sopt->cipso+1];
  176. dopt->cipso = dopt->optlen+sizeof(struct iphdr);
  177. memcpy(dptr, sptr+sopt->cipso, optlen);
  178. dptr += optlen;
  179. dopt->optlen += optlen;
  180. }
  181. while (dopt->optlen & 3) {
  182. *dptr++ = IPOPT_END;
  183. dopt->optlen++;
  184. }
  185. return 0;
  186. }
  187. /*
  188. * Options "fragmenting", just fill options not
  189. * allowed in fragments with NOOPs.
  190. * Simple and stupid 8), but the most efficient way.
  191. */
  192. void ip_options_fragment(struct sk_buff * skb)
  193. {
  194. unsigned char *optptr = skb_network_header(skb) + sizeof(struct iphdr);
  195. struct ip_options * opt = &(IPCB(skb)->opt);
  196. int l = opt->optlen;
  197. int optlen;
  198. while (l > 0) {
  199. switch (*optptr) {
  200. case IPOPT_END:
  201. return;
  202. case IPOPT_NOOP:
  203. l--;
  204. optptr++;
  205. continue;
  206. }
  207. optlen = optptr[1];
  208. if (optlen<2 || optlen>l)
  209. return;
  210. if (!IPOPT_COPIED(*optptr))
  211. memset(optptr, IPOPT_NOOP, optlen);
  212. l -= optlen;
  213. optptr += optlen;
  214. }
  215. opt->ts = 0;
  216. opt->rr = 0;
  217. opt->rr_needaddr = 0;
  218. opt->ts_needaddr = 0;
  219. opt->ts_needtime = 0;
  220. return;
  221. }
  222. /*
  223. * Verify options and fill pointers in struct options.
  224. * Caller should clear *opt, and set opt->data.
  225. * If opt == NULL, then skb->data should point to IP header.
  226. */
  227. int ip_options_compile(struct net *net,
  228. struct ip_options * opt, struct sk_buff * skb)
  229. {
  230. int l;
  231. unsigned char * iph;
  232. unsigned char * optptr;
  233. int optlen;
  234. unsigned char * pp_ptr = NULL;
  235. struct rtable *rt = NULL;
  236. if (skb != NULL) {
  237. rt = skb->rtable;
  238. optptr = (unsigned char *)&(ip_hdr(skb)[1]);
  239. } else
  240. optptr = opt->__data;
  241. iph = optptr - sizeof(struct iphdr);
  242. for (l = opt->optlen; l > 0; ) {
  243. switch (*optptr) {
  244. case IPOPT_END:
  245. for (optptr++, l--; l>0; optptr++, l--) {
  246. if (*optptr != IPOPT_END) {
  247. *optptr = IPOPT_END;
  248. opt->is_changed = 1;
  249. }
  250. }
  251. goto eol;
  252. case IPOPT_NOOP:
  253. l--;
  254. optptr++;
  255. continue;
  256. }
  257. optlen = optptr[1];
  258. if (optlen<2 || optlen>l) {
  259. pp_ptr = optptr;
  260. goto error;
  261. }
  262. switch (*optptr) {
  263. case IPOPT_SSRR:
  264. case IPOPT_LSRR:
  265. if (optlen < 3) {
  266. pp_ptr = optptr + 1;
  267. goto error;
  268. }
  269. if (optptr[2] < 4) {
  270. pp_ptr = optptr + 2;
  271. goto error;
  272. }
  273. /* NB: cf RFC-1812 5.2.4.1 */
  274. if (opt->srr) {
  275. pp_ptr = optptr;
  276. goto error;
  277. }
  278. if (!skb) {
  279. if (optptr[2] != 4 || optlen < 7 || ((optlen-3) & 3)) {
  280. pp_ptr = optptr + 1;
  281. goto error;
  282. }
  283. memcpy(&opt->faddr, &optptr[3], 4);
  284. if (optlen > 7)
  285. memmove(&optptr[3], &optptr[7], optlen-7);
  286. }
  287. opt->is_strictroute = (optptr[0] == IPOPT_SSRR);
  288. opt->srr = optptr - iph;
  289. break;
  290. case IPOPT_RR:
  291. if (opt->rr) {
  292. pp_ptr = optptr;
  293. goto error;
  294. }
  295. if (optlen < 3) {
  296. pp_ptr = optptr + 1;
  297. goto error;
  298. }
  299. if (optptr[2] < 4) {
  300. pp_ptr = optptr + 2;
  301. goto error;
  302. }
  303. if (optptr[2] <= optlen) {
  304. if (optptr[2]+3 > optlen) {
  305. pp_ptr = optptr + 2;
  306. goto error;
  307. }
  308. if (skb) {
  309. memcpy(&optptr[optptr[2]-1], &rt->rt_spec_dst, 4);
  310. opt->is_changed = 1;
  311. }
  312. optptr[2] += 4;
  313. opt->rr_needaddr = 1;
  314. }
  315. opt->rr = optptr - iph;
  316. break;
  317. case IPOPT_TIMESTAMP:
  318. if (opt->ts) {
  319. pp_ptr = optptr;
  320. goto error;
  321. }
  322. if (optlen < 4) {
  323. pp_ptr = optptr + 1;
  324. goto error;
  325. }
  326. if (optptr[2] < 5) {
  327. pp_ptr = optptr + 2;
  328. goto error;
  329. }
  330. if (optptr[2] <= optlen) {
  331. __be32 *timeptr = NULL;
  332. if (optptr[2]+3 > optptr[1]) {
  333. pp_ptr = optptr + 2;
  334. goto error;
  335. }
  336. switch (optptr[3]&0xF) {
  337. case IPOPT_TS_TSONLY:
  338. opt->ts = optptr - iph;
  339. if (skb)
  340. timeptr = (__be32*)&optptr[optptr[2]-1];
  341. opt->ts_needtime = 1;
  342. optptr[2] += 4;
  343. break;
  344. case IPOPT_TS_TSANDADDR:
  345. if (optptr[2]+7 > optptr[1]) {
  346. pp_ptr = optptr + 2;
  347. goto error;
  348. }
  349. opt->ts = optptr - iph;
  350. if (skb) {
  351. memcpy(&optptr[optptr[2]-1], &rt->rt_spec_dst, 4);
  352. timeptr = (__be32*)&optptr[optptr[2]+3];
  353. }
  354. opt->ts_needaddr = 1;
  355. opt->ts_needtime = 1;
  356. optptr[2] += 8;
  357. break;
  358. case IPOPT_TS_PRESPEC:
  359. if (optptr[2]+7 > optptr[1]) {
  360. pp_ptr = optptr + 2;
  361. goto error;
  362. }
  363. opt->ts = optptr - iph;
  364. {
  365. __be32 addr;
  366. memcpy(&addr, &optptr[optptr[2]-1], 4);
  367. if (inet_addr_type(net, addr) == RTN_UNICAST)
  368. break;
  369. if (skb)
  370. timeptr = (__be32*)&optptr[optptr[2]+3];
  371. }
  372. opt->ts_needtime = 1;
  373. optptr[2] += 8;
  374. break;
  375. default:
  376. if (!skb && !capable(CAP_NET_RAW)) {
  377. pp_ptr = optptr + 3;
  378. goto error;
  379. }
  380. break;
  381. }
  382. if (timeptr) {
  383. struct timespec tv;
  384. __be32 midtime;
  385. getnstimeofday(&tv);
  386. midtime = htonl((tv.tv_sec % 86400) * MSEC_PER_SEC + tv.tv_nsec / NSEC_PER_MSEC);
  387. memcpy(timeptr, &midtime, sizeof(__be32));
  388. opt->is_changed = 1;
  389. }
  390. } else {
  391. unsigned overflow = optptr[3]>>4;
  392. if (overflow == 15) {
  393. pp_ptr = optptr + 3;
  394. goto error;
  395. }
  396. opt->ts = optptr - iph;
  397. if (skb) {
  398. optptr[3] = (optptr[3]&0xF)|((overflow+1)<<4);
  399. opt->is_changed = 1;
  400. }
  401. }
  402. break;
  403. case IPOPT_RA:
  404. if (optlen < 4) {
  405. pp_ptr = optptr + 1;
  406. goto error;
  407. }
  408. if (optptr[2] == 0 && optptr[3] == 0)
  409. opt->router_alert = optptr - iph;
  410. break;
  411. case IPOPT_CIPSO:
  412. if ((!skb && !capable(CAP_NET_RAW)) || opt->cipso) {
  413. pp_ptr = optptr;
  414. goto error;
  415. }
  416. opt->cipso = optptr - iph;
  417. if (cipso_v4_validate(skb, &optptr)) {
  418. pp_ptr = optptr;
  419. goto error;
  420. }
  421. break;
  422. case IPOPT_SEC:
  423. case IPOPT_SID:
  424. default:
  425. if (!skb && !capable(CAP_NET_RAW)) {
  426. pp_ptr = optptr;
  427. goto error;
  428. }
  429. break;
  430. }
  431. l -= optlen;
  432. optptr += optlen;
  433. }
  434. eol:
  435. if (!pp_ptr)
  436. return 0;
  437. error:
  438. if (skb) {
  439. icmp_send(skb, ICMP_PARAMETERPROB, 0, htonl((pp_ptr-iph)<<24));
  440. }
  441. return -EINVAL;
  442. }
  443. /*
  444. * Undo all the changes done by ip_options_compile().
  445. */
  446. void ip_options_undo(struct ip_options * opt)
  447. {
  448. if (opt->srr) {
  449. unsigned char * optptr = opt->__data+opt->srr-sizeof(struct iphdr);
  450. memmove(optptr+7, optptr+3, optptr[1]-7);
  451. memcpy(optptr+3, &opt->faddr, 4);
  452. }
  453. if (opt->rr_needaddr) {
  454. unsigned char * optptr = opt->__data+opt->rr-sizeof(struct iphdr);
  455. optptr[2] -= 4;
  456. memset(&optptr[optptr[2]-1], 0, 4);
  457. }
  458. if (opt->ts) {
  459. unsigned char * optptr = opt->__data+opt->ts-sizeof(struct iphdr);
  460. if (opt->ts_needtime) {
  461. optptr[2] -= 4;
  462. memset(&optptr[optptr[2]-1], 0, 4);
  463. if ((optptr[3]&0xF) == IPOPT_TS_PRESPEC)
  464. optptr[2] -= 4;
  465. }
  466. if (opt->ts_needaddr) {
  467. optptr[2] -= 4;
  468. memset(&optptr[optptr[2]-1], 0, 4);
  469. }
  470. }
  471. }
  472. static struct ip_options *ip_options_get_alloc(const int optlen)
  473. {
  474. return kzalloc(sizeof(struct ip_options) + ((optlen + 3) & ~3),
  475. GFP_KERNEL);
  476. }
  477. static int ip_options_get_finish(struct net *net, struct ip_options **optp,
  478. struct ip_options *opt, int optlen)
  479. {
  480. while (optlen & 3)
  481. opt->__data[optlen++] = IPOPT_END;
  482. opt->optlen = optlen;
  483. if (optlen && ip_options_compile(net, opt, NULL)) {
  484. kfree(opt);
  485. return -EINVAL;
  486. }
  487. kfree(*optp);
  488. *optp = opt;
  489. return 0;
  490. }
  491. int ip_options_get_from_user(struct net *net, struct ip_options **optp,
  492. unsigned char __user *data, int optlen)
  493. {
  494. struct ip_options *opt = ip_options_get_alloc(optlen);
  495. if (!opt)
  496. return -ENOMEM;
  497. if (optlen && copy_from_user(opt->__data, data, optlen)) {
  498. kfree(opt);
  499. return -EFAULT;
  500. }
  501. return ip_options_get_finish(net, optp, opt, optlen);
  502. }
  503. int ip_options_get(struct net *net, struct ip_options **optp,
  504. unsigned char *data, int optlen)
  505. {
  506. struct ip_options *opt = ip_options_get_alloc(optlen);
  507. if (!opt)
  508. return -ENOMEM;
  509. if (optlen)
  510. memcpy(opt->__data, data, optlen);
  511. return ip_options_get_finish(net, optp, opt, optlen);
  512. }
  513. void ip_forward_options(struct sk_buff *skb)
  514. {
  515. struct ip_options * opt = &(IPCB(skb)->opt);
  516. unsigned char * optptr;
  517. struct rtable *rt = skb->rtable;
  518. unsigned char *raw = skb_network_header(skb);
  519. if (opt->rr_needaddr) {
  520. optptr = (unsigned char *)raw + opt->rr;
  521. ip_rt_get_source(&optptr[optptr[2]-5], rt);
  522. opt->is_changed = 1;
  523. }
  524. if (opt->srr_is_hit) {
  525. int srrptr, srrspace;
  526. optptr = raw + opt->srr;
  527. for ( srrptr=optptr[2], srrspace = optptr[1];
  528. srrptr <= srrspace;
  529. srrptr += 4
  530. ) {
  531. if (srrptr + 3 > srrspace)
  532. break;
  533. if (memcmp(&rt->rt_dst, &optptr[srrptr-1], 4) == 0)
  534. break;
  535. }
  536. if (srrptr + 3 <= srrspace) {
  537. opt->is_changed = 1;
  538. ip_rt_get_source(&optptr[srrptr-1], rt);
  539. ip_hdr(skb)->daddr = rt->rt_dst;
  540. optptr[2] = srrptr+4;
  541. } else if (net_ratelimit())
  542. printk(KERN_CRIT "ip_forward(): Argh! Destination lost!\n");
  543. if (opt->ts_needaddr) {
  544. optptr = raw + opt->ts;
  545. ip_rt_get_source(&optptr[optptr[2]-9], rt);
  546. opt->is_changed = 1;
  547. }
  548. }
  549. if (opt->is_changed) {
  550. opt->is_changed = 0;
  551. ip_send_check(ip_hdr(skb));
  552. }
  553. }
  554. int ip_options_rcv_srr(struct sk_buff *skb)
  555. {
  556. struct ip_options *opt = &(IPCB(skb)->opt);
  557. int srrspace, srrptr;
  558. __be32 nexthop;
  559. struct iphdr *iph = ip_hdr(skb);
  560. unsigned char *optptr = skb_network_header(skb) + opt->srr;
  561. struct rtable *rt = skb->rtable;
  562. struct rtable *rt2;
  563. int err;
  564. if (!opt->srr)
  565. return 0;
  566. if (skb->pkt_type != PACKET_HOST)
  567. return -EINVAL;
  568. if (rt->rt_type == RTN_UNICAST) {
  569. if (!opt->is_strictroute)
  570. return 0;
  571. icmp_send(skb, ICMP_PARAMETERPROB, 0, htonl(16<<24));
  572. return -EINVAL;
  573. }
  574. if (rt->rt_type != RTN_LOCAL)
  575. return -EINVAL;
  576. for (srrptr=optptr[2], srrspace = optptr[1]; srrptr <= srrspace; srrptr += 4) {
  577. if (srrptr + 3 > srrspace) {
  578. icmp_send(skb, ICMP_PARAMETERPROB, 0, htonl((opt->srr+2)<<24));
  579. return -EINVAL;
  580. }
  581. memcpy(&nexthop, &optptr[srrptr-1], 4);
  582. rt = skb->rtable;
  583. skb->rtable = NULL;
  584. err = ip_route_input(skb, nexthop, iph->saddr, iph->tos, skb->dev);
  585. rt2 = skb->rtable;
  586. if (err || (rt2->rt_type != RTN_UNICAST && rt2->rt_type != RTN_LOCAL)) {
  587. ip_rt_put(rt2);
  588. skb->rtable = rt;
  589. return -EINVAL;
  590. }
  591. ip_rt_put(rt);
  592. if (rt2->rt_type != RTN_LOCAL)
  593. break;
  594. /* Superfast 8) loopback forward */
  595. memcpy(&iph->daddr, &optptr[srrptr-1], 4);
  596. opt->is_changed = 1;
  597. }
  598. if (srrptr <= srrspace) {
  599. opt->srr_is_hit = 1;
  600. opt->is_changed = 1;
  601. }
  602. return 0;
  603. }