loopback.c 7.5 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300
  1. /*
  2. * INET An implementation of the TCP/IP protocol suite for the LINUX
  3. * operating system. INET is implemented using the BSD Socket
  4. * interface as the means of communication with the user level.
  5. *
  6. * Pseudo-driver for the loopback interface.
  7. *
  8. * Version: @(#)loopback.c 1.0.4b 08/16/93
  9. *
  10. * Authors: Ross Biro
  11. * Fred N. van Kempen, <waltje@uWalt.NL.Mugnet.ORG>
  12. * Donald Becker, <becker@scyld.com>
  13. *
  14. * Alan Cox : Fixed oddments for NET3.014
  15. * Alan Cox : Rejig for NET3.029 snap #3
  16. * Alan Cox : Fixed NET3.029 bugs and sped up
  17. * Larry McVoy : Tiny tweak to double performance
  18. * Alan Cox : Backed out LMV's tweak - the linux mm
  19. * can't take it...
  20. * Michael Griffith: Don't bother computing the checksums
  21. * on packets received on the loopback
  22. * interface.
  23. * Alexey Kuznetsov: Potential hang under some extreme
  24. * cases removed.
  25. *
  26. * This program is free software; you can redistribute it and/or
  27. * modify it under the terms of the GNU General Public License
  28. * as published by the Free Software Foundation; either version
  29. * 2 of the License, or (at your option) any later version.
  30. */
  31. #include <linux/kernel.h>
  32. #include <linux/jiffies.h>
  33. #include <linux/module.h>
  34. #include <linux/interrupt.h>
  35. #include <linux/fs.h>
  36. #include <linux/types.h>
  37. #include <linux/string.h>
  38. #include <linux/socket.h>
  39. #include <linux/errno.h>
  40. #include <linux/fcntl.h>
  41. #include <linux/in.h>
  42. #include <linux/init.h>
  43. #include <asm/system.h>
  44. #include <asm/uaccess.h>
  45. #include <asm/io.h>
  46. #include <linux/inet.h>
  47. #include <linux/netdevice.h>
  48. #include <linux/etherdevice.h>
  49. #include <linux/skbuff.h>
  50. #include <linux/ethtool.h>
  51. #include <net/sock.h>
  52. #include <net/checksum.h>
  53. #include <linux/if_ether.h> /* For the statistics structure. */
  54. #include <linux/if_arp.h> /* For ARPHRD_ETHER */
  55. #include <linux/ip.h>
  56. #include <linux/tcp.h>
  57. #include <linux/percpu.h>
  58. #include <net/net_namespace.h>
  /*
   * Per-CPU traffic counters for the loopback device.
   *
   * loopback_xmit() bumps the instance belonging to the CPU it runs on and
   * get_stats() adds the instances of all possible CPUs together.
   */
  struct pcpu_lstats {
      unsigned long packets;  /* number of skbs looped back on this CPU */
      unsigned long bytes;    /* sum of skb->len over those skbs */
  };

  /*
   * NOTE(review): this macro is not referenced anywhere in the visible part
   * of the file; the meaning of the individual terms cannot be confirmed
   * from here.
   */
  #define LOOPBACK_OVERHEAD (128 + MAX_HEADER + 16 + 16)
  /*
   * Software stand-in for TCP segmentation offload, compiled only when
   * LOOPBACK_TSO is defined.  It is deliberately simple (allocate small
   * chunks and copy) and doubles as documentation of what is expected from
   * a large-send capable device, apart from the TCP checksum, which is
   * ignored for loopback.
   *
   * The payload of @skb (an IPv4/TCP GSO packet; the caller checks both) is
   * cut into pieces of at most gso_size bytes.  Every piece is copied into a
   * freshly allocated skb behind a copy of the original IP and TCP headers,
   * and the per-segment fields are then patched: IP total length, IP id
   * (incremented per segment), IP header checksum and TCP sequence number
   * (advanced by the payload already emitted).  FIN and PSH are cleared on
   * every segment except the last one.
   *
   * Each segment is handed to netif_rx().  If an skb allocation fails the
   * loop stops and the remaining payload is dropped.  @skb itself is always
   * freed before returning.
   */
  #ifdef LOOPBACK_TSO
  static void emulate_large_send_offload(struct sk_buff *skb)
  {
      struct iphdr *orig_iph = ip_hdr(skb);
      struct tcphdr *orig_th = (struct tcphdr *)(skb_network_header(skb) +
                                                 (orig_iph->ihl * 4));
      /* Combined IP + TCP header length in bytes. */
      unsigned int hdr_len = (orig_iph->ihl + orig_th->doff) * 4;
      /* Largest segment emitted: headers plus one gso_size of payload. */
      unsigned int seg_max = skb_shinfo(skb)->gso_size + hdr_len;
      /* Payload bytes already handed to netif_rx(). */
      unsigned int sent = 0;
      u32 next_seq = ntohl(orig_th->seq);
      u16 next_id = ntohs(orig_iph->id);

      while (sent + hdr_len < skb->len) {
          unsigned int payload = min(seg_max, skb->len - sent) - hdr_len;
          struct sk_buff *seg = alloc_skb(seg_max + 32, GFP_ATOMIC);
          struct iphdr *iph;
          struct tcphdr *th;

          if (!seg)
              break;

          /* Keep 32 bytes of headroom; the MAC header offset points into it. */
          skb_reserve(seg, 32);
          skb_set_mac_header(seg, -ETH_HLEN);
          skb_reset_network_header(seg);

          /* Headers first, then this segment's slice of the payload. */
          skb_copy_to_linear_data(seg, skb_network_header(skb), hdr_len);
          if (skb_copy_bits(skb, hdr_len + sent, seg->data + hdr_len, payload))
              BUG();
          skb_put(seg, hdr_len + payload);

          /* Inherit the bookkeeping of the original packet. */
          seg->dev = skb->dev;
          seg->dst = dst_clone(skb->dst);
          seg->protocol = skb->protocol;
          seg->priority = skb->priority;
          seg->pkt_type = skb->pkt_type;
          seg->ip_summed = CHECKSUM_UNNECESSARY;
          memcpy(seg->cb, skb->cb, sizeof(skb->cb));

          /* Patch the copied headers so they describe this segment. */
          iph = ip_hdr(seg);
          th = (struct tcphdr *)(skb_network_header(seg) + iph->ihl * 4);

          iph->tot_len = htons(payload + hdr_len);
          iph->id = htons(next_id);
          iph->check = 0;
          iph->check = ip_fast_csum((unsigned char *)iph, iph->ihl);

          th->seq = htonl(next_seq);
          /* More data follows: FIN/PSH belong on the final segment only. */
          if (sent + hdr_len + payload < skb->len) {
              th->psh = 0;
              th->fin = 0;
          }

          netif_rx(seg);

          sent += payload;
          next_seq += payload;
          next_id++;
      }

      dev_kfree_skb(skb);
  }
  #endif /* LOOPBACK_TSO */
  120. /*
  121. * The higher levels take care of making this non-reentrant (it's
  122. * called with bh's disabled).
  123. */
  124. static int loopback_xmit(struct sk_buff *skb, struct net_device *dev)
  125. {
  126. struct pcpu_lstats *pcpu_lstats, *lb_stats;
  127. skb_orphan(skb);
  128. skb->protocol = eth_type_trans(skb,dev);
  129. #ifndef LOOPBACK_MUST_CHECKSUM
  130. skb->ip_summed = CHECKSUM_UNNECESSARY;
  131. #endif
  132. #ifdef LOOPBACK_TSO
  133. if (skb_is_gso(skb)) {
  134. BUG_ON(skb->protocol != htons(ETH_P_IP));
  135. BUG_ON(ip_hdr(skb)->protocol != IPPROTO_TCP);
  136. emulate_large_send_offload(skb);
  137. return 0;
  138. }
  139. #endif
  140. dev->last_rx = jiffies;
  141. /* it's OK to use per_cpu_ptr() because BHs are off */
  142. pcpu_lstats = netdev_priv(dev);
  143. lb_stats = per_cpu_ptr(pcpu_lstats, smp_processor_id());
  144. lb_stats->bytes += skb->len;
  145. lb_stats->packets++;
  146. netif_rx(skb);
  147. return 0;
  148. }
  149. static struct net_device_stats *get_stats(struct net_device *dev)
  150. {
  151. const struct pcpu_lstats *pcpu_lstats;
  152. struct net_device_stats *stats = &dev->stats;
  153. unsigned long bytes = 0;
  154. unsigned long packets = 0;
  155. int i;
  156. pcpu_lstats = netdev_priv(dev);
  157. for_each_possible_cpu(i) {
  158. const struct pcpu_lstats *lb_stats;
  159. lb_stats = per_cpu_ptr(pcpu_lstats, i);
  160. bytes += lb_stats->bytes;
  161. packets += lb_stats->packets;
  162. }
  163. stats->rx_packets = packets;
  164. stats->tx_packets = packets;
  165. stats->rx_bytes = bytes;
  166. stats->tx_bytes = bytes;
  167. return stats;
  168. }
  169. static u32 always_on(struct net_device *dev)
  170. {
  171. return 1;
  172. }
  173. static const struct ethtool_ops loopback_ethtool_ops = {
  174. .get_link = always_on,
  175. .set_tso = ethtool_op_set_tso,
  176. .get_tx_csum = always_on,
  177. .get_sg = always_on,
  178. .get_rx_csum = always_on,
  179. };
  180. static int loopback_dev_init(struct net_device *dev)
  181. {
  182. struct pcpu_lstats *lstats;
  183. lstats = alloc_percpu(struct pcpu_lstats);
  184. if (!lstats)
  185. return -ENOMEM;
  186. dev->priv = lstats;
  187. return 0;
  188. }
  /*
   * dev->destructor hook: release the per-CPU counters obtained through
   * netdev_priv(), then free the net_device itself.
   */
  static void loopback_dev_free(struct net_device *dev)
  {
      free_percpu(netdev_priv(dev));
      free_netdev(dev);
  }
  195. /*
  196. * The loopback device is special. There is only one instance
  197. * per network namespace.
  198. */
  199. static void loopback_setup(struct net_device *dev)
  200. {
  201. dev->get_stats = &get_stats;
  202. dev->mtu = (16 * 1024) + 20 + 20 + 12;
  203. dev->hard_start_xmit = loopback_xmit;
  204. dev->hard_header_len = ETH_HLEN; /* 14 */
  205. dev->addr_len = ETH_ALEN; /* 6 */
  206. dev->tx_queue_len = 0;
  207. dev->type = ARPHRD_LOOPBACK; /* 0x0001*/
  208. dev->flags = IFF_LOOPBACK;
  209. dev->features = NETIF_F_SG | NETIF_F_FRAGLIST
  210. #ifdef LOOPBACK_TSO
  211. | NETIF_F_TSO
  212. #endif
  213. | NETIF_F_NO_CSUM
  214. | NETIF_F_HIGHDMA
  215. | NETIF_F_LLTX
  216. | NETIF_F_NETNS_LOCAL,
  217. dev->ethtool_ops = &loopback_ethtool_ops;
  218. dev->header_ops = &eth_header_ops;
  219. dev->init = loopback_dev_init;
  220. dev->destructor = loopback_dev_free;
  221. }
  222. /* Setup and register the loopback device. */
  223. static __net_init int loopback_net_init(struct net *net)
  224. {
  225. struct net_device *dev;
  226. int err;
  227. err = -ENOMEM;
  228. dev = alloc_netdev(0, "lo", loopback_setup);
  229. if (!dev)
  230. goto out;
  231. dev->nd_net = net;
  232. err = register_netdev(dev);
  233. if (err)
  234. goto out_free_netdev;
  235. net->loopback_dev = dev;
  236. return 0;
  237. out_free_netdev:
  238. free_netdev(dev);
  239. out:
  240. if (net == &init_net)
  241. panic("loopback: Failed to register netdevice: %d\n", err);
  242. return err;
  243. }
  244. static __net_exit void loopback_net_exit(struct net *net)
  245. {
  246. struct net_device *dev = net->loopback_dev;
  247. unregister_netdev(dev);
  248. }
  249. static struct pernet_operations __net_initdata loopback_net_ops = {
  250. .init = loopback_net_init,
  251. .exit = loopback_net_exit,
  252. };
  253. static int __init loopback_init(void)
  254. {
  255. return register_pernet_device(&loopback_net_ops);
  256. }
  257. /* Loopback is special. It should be initialized before any other network
  258. * device and network subsystem.
  259. */
  260. fs_initcall(loopback_init);