ll_poll.h 4.8 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202
  1. /*
  2. * Low Latency Sockets
  3. * Copyright(c) 2013 Intel Corporation.
  4. *
  5. * This program is free software; you can redistribute it and/or modify it
  6. * under the terms and conditions of the GNU General Public License,
  7. * version 2, as published by the Free Software Foundation.
  8. *
  9. * This program is distributed in the hope it will be useful, but WITHOUT
  10. * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
  11. * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for
  12. * more details.
  13. *
  14. * You should have received a copy of the GNU General Public License along with
  15. * this program; if not, write to the Free Software Foundation, Inc.,
  16. * 51 Franklin St - Fifth Floor, Boston, MA 02110-1301 USA.
  17. *
  18. * Author: Eliezer Tamir
  19. *
  20. * Contact Information:
  21. * e1000-devel Mailing List <e1000-devel@lists.sourceforge.net>
  22. */
  23. #ifndef _LINUX_NET_LL_POLL_H
  24. #define _LINUX_NET_LL_POLL_H
  25. #include <linux/netdevice.h>
  26. #include <net/ip.h>
  27. #ifdef CONFIG_NET_LL_RX_POLL
  28. struct napi_struct;
  29. extern unsigned int sysctl_net_ll_read __read_mostly;
  30. extern unsigned int sysctl_net_ll_poll __read_mostly;
  31. /* return values from ndo_ll_poll */
  32. #define LL_FLUSH_FAILED -1
  33. #define LL_FLUSH_BUSY -2
  34. static inline bool net_busy_loop_on(void)
  35. {
  36. return sysctl_net_ll_poll;
  37. }
  38. /* a wrapper to make debug_smp_processor_id() happy
  39. * we can use sched_clock() because we don't care much about precision
  40. * we only care that the average is bounded
  41. */
  42. #ifdef CONFIG_DEBUG_PREEMPT
  43. static inline u64 busy_loop_sched_clock(void)
  44. {
  45. u64 rc;
  46. preempt_disable_notrace();
  47. rc = sched_clock();
  48. preempt_enable_no_resched_notrace();
  49. return rc;
  50. }
  51. #else /* CONFIG_DEBUG_PREEMPT */
  52. static inline u64 busy_loop_sched_clock(void)
  53. {
  54. return sched_clock();
  55. }
  56. #endif /* CONFIG_DEBUG_PREEMPT */
  57. /* we don't mind a ~2.5% imprecision so <<10 instead of *1000
  58. * sk->sk_ll_usec is a u_int so this can't overflow
  59. */
  60. static inline u64 sk_busy_loop_end_time(struct sock *sk)
  61. {
  62. return (u64)ACCESS_ONCE(sk->sk_ll_usec) << 10;
  63. }
  64. /* in poll/select we use the global sysctl_net_ll_poll value
  65. * only call sched_clock() if enabled
  66. */
  67. static inline u64 busy_loop_end_time(void)
  68. {
  69. return (u64)ACCESS_ONCE(sysctl_net_ll_poll) << 10;
  70. }
  71. /* if flag is not set we don't need to know the time
  72. * so we want to avoid a potentially expensive sched_clock()
  73. */
  74. static inline u64 busy_loop_start_time(unsigned int flag)
  75. {
  76. return flag ? busy_loop_sched_clock() : 0;
  77. }
  78. static inline bool sk_can_busy_loop(struct sock *sk)
  79. {
  80. return sk->sk_ll_usec && sk->sk_napi_id &&
  81. !need_resched() && !signal_pending(current);
  82. }
  83. /* careful! time_in_range64 will evaluate now twice */
  84. static inline bool busy_loop_range(u64 start_time, u64 run_time)
  85. {
  86. u64 now = busy_loop_sched_clock();
  87. return time_in_range64(now, start_time, start_time + run_time);
  88. }
  89. /* when used in sock_poll() nonblock is known at compile time to be true
  90. * so the loop and end_time will be optimized out
  91. */
  92. static inline bool sk_busy_loop(struct sock *sk, int nonblock)
  93. {
  94. u64 start_time = busy_loop_start_time(!nonblock);
  95. u64 end_time = sk_busy_loop_end_time(sk);
  96. const struct net_device_ops *ops;
  97. struct napi_struct *napi;
  98. int rc = false;
  99. /*
  100. * rcu read lock for napi hash
  101. * bh so we don't race with net_rx_action
  102. */
  103. rcu_read_lock_bh();
  104. napi = napi_by_id(sk->sk_napi_id);
  105. if (!napi)
  106. goto out;
  107. ops = napi->dev->netdev_ops;
  108. if (!ops->ndo_ll_poll)
  109. goto out;
  110. do {
  111. rc = ops->ndo_ll_poll(napi);
  112. if (rc == LL_FLUSH_FAILED)
  113. break; /* permanent failure */
  114. if (rc > 0)
  115. /* local bh are disabled so it is ok to use _BH */
  116. NET_ADD_STATS_BH(sock_net(sk),
  117. LINUX_MIB_LOWLATENCYRXPACKETS, rc);
  118. } while (!nonblock && skb_queue_empty(&sk->sk_receive_queue) &&
  119. busy_loop_range(start_time, end_time));
  120. rc = !skb_queue_empty(&sk->sk_receive_queue);
  121. out:
  122. rcu_read_unlock_bh();
  123. return rc;
  124. }
  125. /* used in the NIC receive handler to mark the skb */
  126. static inline void skb_mark_ll(struct sk_buff *skb, struct napi_struct *napi)
  127. {
  128. skb->napi_id = napi->napi_id;
  129. }
  130. /* used in the protocol hanlder to propagate the napi_id to the socket */
  131. static inline void sk_mark_ll(struct sock *sk, struct sk_buff *skb)
  132. {
  133. sk->sk_napi_id = skb->napi_id;
  134. }
  135. #else /* CONFIG_NET_LL_RX_POLL */
  136. static inline unsigned long net_busy_loop_on(void)
  137. {
  138. return 0;
  139. }
  140. static inline u64 busy_loop_start_time(unsigned int flag)
  141. {
  142. return 0;
  143. }
  144. static inline u64 busy_loop_end_time(void)
  145. {
  146. return 0;
  147. }
  148. static inline bool sk_can_busy_loop(struct sock *sk)
  149. {
  150. return false;
  151. }
  152. static inline bool sk_busy_poll(struct sock *sk, int nonblock)
  153. {
  154. return false;
  155. }
  156. static inline void skb_mark_ll(struct sk_buff *skb, struct napi_struct *napi)
  157. {
  158. }
  159. static inline void sk_mark_ll(struct sock *sk, struct sk_buff *skb)
  160. {
  161. }
  162. static inline bool busy_loop_range(u64 start_time, u64 run_time)
  163. {
  164. return false;
  165. }
  166. #endif /* CONFIG_NET_LL_RX_POLL */
  167. #endif /* _LINUX_NET_LL_POLL_H */