ll_poll.h 4.4 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192
  1. /*
  2. * Low Latency Sockets
  3. * Copyright(c) 2013 Intel Corporation.
  4. *
  5. * This program is free software; you can redistribute it and/or modify it
  6. * under the terms and conditions of the GNU General Public License,
  7. * version 2, as published by the Free Software Foundation.
  8. *
  9. * This program is distributed in the hope it will be useful, but WITHOUT
  10. * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
  11. * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for
  12. * more details.
  13. *
  14. * You should have received a copy of the GNU General Public License along with
  15. * this program; if not, write to the Free Software Foundation, Inc.,
  16. * 51 Franklin St - Fifth Floor, Boston, MA 02110-1301 USA.
  17. *
  18. * Author: Eliezer Tamir
  19. *
  20. * Contact Information:
  21. * e1000-devel Mailing List <e1000-devel@lists.sourceforge.net>
  22. */
  23. #ifndef _LINUX_NET_LL_POLL_H
  24. #define _LINUX_NET_LL_POLL_H
  25. #include <linux/netdevice.h>
  26. #include <net/ip.h>
  27. #ifdef CONFIG_NET_LL_RX_POLL
  28. struct napi_struct;
  29. extern unsigned int sysctl_net_ll_read __read_mostly;
  30. extern unsigned int sysctl_net_ll_poll __read_mostly;
  /* Return values from ndo_ll_poll.
   * LL_FLUSH_FAILED is treated by sk_poll_ll() as a permanent failure that
   * ends polling. The negative values are parenthesized so that each macro
   * expands to a single operand whatever expression surrounds it.
   */
  #define LL_FLUSH_FAILED (-1)
  #define LL_FLUSH_BUSY (-2)
  34. static inline unsigned int ll_get_flag(void)
  35. {
  36. return sysctl_net_ll_poll ? POLL_LL : 0;
  37. }
  38. /* a wrapper to make debug_smp_processor_id() happy
  39. * we can use sched_clock() because we don't care much about precision
  40. * we only care that the average is bounded
  41. */
  42. #ifdef CONFIG_DEBUG_PREEMPT
  43. static inline u64 ll_sched_clock(void)
  44. {
  45. u64 rc;
  46. preempt_disable_notrace();
  47. rc = sched_clock();
  48. preempt_enable_no_resched_notrace();
  49. return rc;
  50. }
  51. #else /* CONFIG_DEBUG_PREEMPT */
  52. static inline u64 ll_sched_clock(void)
  53. {
  54. return sched_clock();
  55. }
  56. #endif /* CONFIG_DEBUG_PREEMPT */
  57. /* we don't mind a ~2.5% imprecision so <<10 instead of *1000
  58. * sk->sk_ll_usec is a u_int so this can't overflow
  59. */
  60. static inline u64 ll_sk_end_time(struct sock *sk)
  61. {
  62. return ((u64)ACCESS_ONCE(sk->sk_ll_usec) << 10) + ll_sched_clock();
  63. }
  64. /* in poll/select we use the global sysctl_net_ll_poll value
  65. * only call sched_clock() if enabled
  66. */
  67. static inline u64 ll_end_time(void)
  68. {
  69. u64 end_time = ACCESS_ONCE(sysctl_net_ll_poll);
  70. return end_time ? (end_time << 10) + ll_sched_clock() : 0;
  71. }
  72. static inline bool sk_valid_ll(struct sock *sk)
  73. {
  74. return sk->sk_ll_usec && sk->sk_napi_id &&
  75. !need_resched() && !signal_pending(current);
  76. }
  77. static inline bool can_poll_ll(u64 end_time)
  78. {
  79. return !time_after64(ll_sched_clock(), end_time);
  80. }
  81. /* when used in sock_poll() nonblock is known at compile time to be true
  82. * so the loop and end_time will be optimized out
  83. */
  84. static inline bool sk_poll_ll(struct sock *sk, int nonblock)
  85. {
  86. u64 end_time = nonblock ? 0 : ll_sk_end_time(sk);
  87. const struct net_device_ops *ops;
  88. struct napi_struct *napi;
  89. int rc = false;
  90. /*
  91. * rcu read lock for napi hash
  92. * bh so we don't race with net_rx_action
  93. */
  94. rcu_read_lock_bh();
  95. napi = napi_by_id(sk->sk_napi_id);
  96. if (!napi)
  97. goto out;
  98. ops = napi->dev->netdev_ops;
  99. if (!ops->ndo_ll_poll)
  100. goto out;
  101. do {
  102. rc = ops->ndo_ll_poll(napi);
  103. if (rc == LL_FLUSH_FAILED)
  104. break; /* permanent failure */
  105. if (rc > 0)
  106. /* local bh are disabled so it is ok to use _BH */
  107. NET_ADD_STATS_BH(sock_net(sk),
  108. LINUX_MIB_LOWLATENCYRXPACKETS, rc);
  109. } while (!nonblock && skb_queue_empty(&sk->sk_receive_queue) &&
  110. can_poll_ll(end_time));
  111. rc = !skb_queue_empty(&sk->sk_receive_queue);
  112. out:
  113. rcu_read_unlock_bh();
  114. return rc;
  115. }
  116. /* used in the NIC receive handler to mark the skb */
  117. static inline void skb_mark_ll(struct sk_buff *skb, struct napi_struct *napi)
  118. {
  119. skb->napi_id = napi->napi_id;
  120. }
  121. /* used in the protocol hanlder to propagate the napi_id to the socket */
  122. static inline void sk_mark_ll(struct sock *sk, struct sk_buff *skb)
  123. {
  124. sk->sk_napi_id = skb->napi_id;
  125. }
  126. #else /* CONFIG_NET_LL_RX_POLL */
  /* Stub used when CONFIG_NET_LL_RX_POLL is not set: no poll flag is ever
   * requested. The return type is unsigned int, the same as the variant
   * built when the option is enabled, so callers see one signature in both
   * configurations.
   */
  static inline unsigned int ll_get_flag(void)
  {
      return 0;
  }
  131. static inline u64 sk_ll_end_time(struct sock *sk)
  132. {
  133. return 0;
  134. }
  135. static inline u64 ll_end_time(void)
  136. {
  137. return 0;
  138. }
  /* Stub used when CONFIG_NET_LL_RX_POLL is not set: no socket is ever
   * eligible for low latency polling.
   */
  static inline bool sk_valid_ll(struct sock *sk)
  {
      return false;
  }
  /* Stub used when CONFIG_NET_LL_RX_POLL is not set: nothing is polled and
   * false is returned.
   */
  static inline bool sk_poll_ll(struct sock *sk, int nonblock)
  {
      return false;
  }
  /* Stub used when CONFIG_NET_LL_RX_POLL is not set: the skb is left
   * untouched.
   */
  static inline void skb_mark_ll(struct sk_buff *skb, struct napi_struct *napi)
  {
      /* nothing to mark */
  }
  /* Stub used when CONFIG_NET_LL_RX_POLL is not set: the socket is left
   * untouched.
   */
  static inline void sk_mark_ll(struct sock *sk, struct sk_buff *skb)
  {
      /* nothing to propagate */
  }
  153. static inline bool can_poll_ll(u64 end_time)
  154. {
  155. return false;
  156. }
  157. #endif /* CONFIG_NET_LL_RX_POLL */
  158. #endif /* _LINUX_NET_LL_POLL_H */