ipoib.h 11 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376
  1. /*
  2. * Copyright (c) 2004, 2005 Topspin Communications. All rights reserved.
  3. * Copyright (c) 2005 Sun Microsystems, Inc. All rights reserved.
  4. * Copyright (c) 2004 Voltaire, Inc. All rights reserved.
  5. *
  6. * This software is available to you under a choice of one of two
  7. * licenses. You may choose to be licensed under the terms of the GNU
  8. * General Public License (GPL) Version 2, available from the file
  9. * COPYING in the main directory of this source tree, or the
  10. * OpenIB.org BSD license below:
  11. *
  12. * Redistribution and use in source and binary forms, with or
  13. * without modification, are permitted provided that the following
  14. * conditions are met:
  15. *
  16. * - Redistributions of source code must retain the above
  17. * copyright notice, this list of conditions and the following
  18. * disclaimer.
  19. *
  20. * - Redistributions in binary form must reproduce the above
  21. * copyright notice, this list of conditions and the following
  22. * disclaimer in the documentation and/or other materials
  23. * provided with the distribution.
  24. *
  25. * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
  26. * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
  27. * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
  28. * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS
  29. * BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN
  30. * ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN
  31. * CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
  32. * SOFTWARE.
  33. *
  34. * $Id: ipoib.h 1358 2004-12-17 22:00:11Z roland $
  35. */
  36. #ifndef _IPOIB_H
  37. #define _IPOIB_H
  38. #include <linux/list.h>
  39. #include <linux/skbuff.h>
  40. #include <linux/netdevice.h>
  41. #include <linux/workqueue.h>
  42. #include <linux/pci.h>
  43. #include <linux/config.h>
  44. #include <linux/kref.h>
  45. #include <linux/if_infiniband.h>
  46. #include <linux/mutex.h>
  47. #include <net/neighbour.h>
  48. #include <asm/atomic.h>
  49. #include <rdma/ib_verbs.h>
  50. #include <rdma/ib_pack.h>
  51. #include <rdma/ib_sa.h>
  52. /* constants */
  53. enum {
  54. IPOIB_PACKET_SIZE = 2048,
  55. IPOIB_BUF_SIZE = IPOIB_PACKET_SIZE + IB_GRH_BYTES,
  56. IPOIB_ENCAP_LEN = 4,
  57. IPOIB_RX_RING_SIZE = 128,
  58. IPOIB_TX_RING_SIZE = 64,
  59. IPOIB_NUM_WC = 4,
  60. IPOIB_MAX_PATH_REC_QUEUE = 3,
  61. IPOIB_MAX_MCAST_QUEUE = 3,
  62. IPOIB_FLAG_OPER_UP = 0,
  63. IPOIB_FLAG_INITIALIZED = 1,
  64. IPOIB_FLAG_ADMIN_UP = 2,
  65. IPOIB_PKEY_ASSIGNED = 3,
  66. IPOIB_PKEY_STOP = 4,
  67. IPOIB_FLAG_SUBINTERFACE = 5,
  68. IPOIB_MCAST_RUN = 6,
  69. IPOIB_STOP_REAPER = 7,
  70. IPOIB_MCAST_STARTED = 8,
  71. IPOIB_MAX_BACKOFF_SECONDS = 16,
  72. IPOIB_MCAST_FLAG_FOUND = 0, /* used in set_multicast_list */
  73. IPOIB_MCAST_FLAG_SENDONLY = 1,
  74. IPOIB_MCAST_FLAG_BUSY = 2, /* joining or already joined */
  75. IPOIB_MCAST_FLAG_ATTACHED = 3,
  76. };
  77. /* structs */
  78. struct ipoib_header {
  79. __be16 proto;
  80. u16 reserved;
  81. };
  82. struct ipoib_pseudoheader {
  83. u8 hwaddr[INFINIBAND_ALEN];
  84. };
  85. struct ipoib_mcast;
  86. struct ipoib_rx_buf {
  87. struct sk_buff *skb;
  88. dma_addr_t mapping;
  89. };
  90. struct ipoib_tx_buf {
  91. struct sk_buff *skb;
  92. DECLARE_PCI_UNMAP_ADDR(mapping)
  93. };
  94. /*
  95. * Device private locking: tx_lock protects members used in TX fast
  96. * path (and we use LLTX so upper layers don't do extra locking).
  97. * lock protects everything else. lock nests inside of tx_lock (ie
  98. * tx_lock must be acquired first if needed).
  99. */
  100. struct ipoib_dev_priv {
  101. spinlock_t lock;
  102. struct net_device *dev;
  103. unsigned long flags;
  104. struct mutex mcast_mutex;
  105. struct mutex vlan_mutex;
  106. struct rb_root path_tree;
  107. struct list_head path_list;
  108. struct ipoib_mcast *broadcast;
  109. struct list_head multicast_list;
  110. struct rb_root multicast_tree;
  111. struct work_struct pkey_task;
  112. struct work_struct mcast_task;
  113. struct work_struct flush_task;
  114. struct work_struct restart_task;
  115. struct work_struct ah_reap_task;
  116. struct ib_device *ca;
  117. u8 port;
  118. u16 pkey;
  119. struct ib_pd *pd;
  120. struct ib_mr *mr;
  121. struct ib_cq *cq;
  122. struct ib_qp *qp;
  123. u32 qkey;
  124. union ib_gid local_gid;
  125. u16 local_lid;
  126. u8 local_rate;
  127. unsigned int admin_mtu;
  128. unsigned int mcast_mtu;
  129. struct ipoib_rx_buf *rx_ring;
  130. spinlock_t tx_lock;
  131. struct ipoib_tx_buf *tx_ring;
  132. unsigned tx_head;
  133. unsigned tx_tail;
  134. struct ib_sge tx_sge;
  135. struct ib_send_wr tx_wr;
  136. struct ib_wc ibwc[IPOIB_NUM_WC];
  137. struct list_head dead_ahs;
  138. struct ib_event_handler event_handler;
  139. struct net_device_stats stats;
  140. struct net_device *parent;
  141. struct list_head child_intfs;
  142. struct list_head list;
  143. #ifdef CONFIG_INFINIBAND_IPOIB_DEBUG
  144. struct list_head fs_list;
  145. struct dentry *mcg_dentry;
  146. struct dentry *path_dentry;
  147. #endif
  148. };
  149. struct ipoib_ah {
  150. struct net_device *dev;
  151. struct ib_ah *ah;
  152. struct list_head list;
  153. struct kref ref;
  154. unsigned last_send;
  155. };
  156. struct ipoib_path {
  157. struct net_device *dev;
  158. struct ib_sa_path_rec pathrec;
  159. struct ipoib_ah *ah;
  160. struct sk_buff_head queue;
  161. struct list_head neigh_list;
  162. int query_id;
  163. struct ib_sa_query *query;
  164. struct completion done;
  165. struct rb_node rb_node;
  166. struct list_head list;
  167. };
  168. struct ipoib_neigh {
  169. struct ipoib_ah *ah;
  170. struct sk_buff_head queue;
  171. struct neighbour *neighbour;
  172. struct list_head list;
  173. };
  174. /*
  175. * We stash a pointer to our private neighbour information after our
  176. * hardware address in neigh->ha. The ALIGN() expression here makes
  177. * sure that this pointer is stored aligned so that an unaligned
  178. * load is not needed to dereference it.
  179. */
  180. static inline struct ipoib_neigh **to_ipoib_neigh(struct neighbour *neigh)
  181. {
  182. return (void*) neigh + ALIGN(offsetof(struct neighbour, ha) +
  183. INFINIBAND_ALEN, sizeof(void *));
  184. }
  185. extern struct workqueue_struct *ipoib_workqueue;
  186. /* functions */
  187. void ipoib_ib_completion(struct ib_cq *cq, void *dev_ptr);
  188. struct ipoib_ah *ipoib_create_ah(struct net_device *dev,
  189. struct ib_pd *pd, struct ib_ah_attr *attr);
  190. void ipoib_free_ah(struct kref *kref);
  191. static inline void ipoib_put_ah(struct ipoib_ah *ah)
  192. {
  193. kref_put(&ah->ref, ipoib_free_ah);
  194. }
  195. int ipoib_open(struct net_device *dev);
  196. int ipoib_add_pkey_attr(struct net_device *dev);
  197. void ipoib_send(struct net_device *dev, struct sk_buff *skb,
  198. struct ipoib_ah *address, u32 qpn);
  199. void ipoib_reap_ah(void *dev_ptr);
  200. void ipoib_flush_paths(struct net_device *dev);
  201. struct ipoib_dev_priv *ipoib_intf_alloc(const char *format);
  202. int ipoib_ib_dev_init(struct net_device *dev, struct ib_device *ca, int port);
  203. void ipoib_ib_dev_flush(void *dev);
  204. void ipoib_ib_dev_cleanup(struct net_device *dev);
  205. int ipoib_ib_dev_open(struct net_device *dev);
  206. int ipoib_ib_dev_up(struct net_device *dev);
  207. int ipoib_ib_dev_down(struct net_device *dev, int flush);
  208. int ipoib_ib_dev_stop(struct net_device *dev);
  209. int ipoib_dev_init(struct net_device *dev, struct ib_device *ca, int port);
  210. void ipoib_dev_cleanup(struct net_device *dev);
  211. void ipoib_mcast_join_task(void *dev_ptr);
  212. void ipoib_mcast_send(struct net_device *dev, union ib_gid *mgid,
  213. struct sk_buff *skb);
  214. void ipoib_mcast_restart_task(void *dev_ptr);
  215. int ipoib_mcast_start_thread(struct net_device *dev);
  216. int ipoib_mcast_stop_thread(struct net_device *dev, int flush);
  217. void ipoib_mcast_dev_down(struct net_device *dev);
  218. void ipoib_mcast_dev_flush(struct net_device *dev);
  219. #ifdef CONFIG_INFINIBAND_IPOIB_DEBUG
  220. struct ipoib_mcast_iter *ipoib_mcast_iter_init(struct net_device *dev);
  221. int ipoib_mcast_iter_next(struct ipoib_mcast_iter *iter);
  222. void ipoib_mcast_iter_read(struct ipoib_mcast_iter *iter,
  223. union ib_gid *gid,
  224. unsigned long *created,
  225. unsigned int *queuelen,
  226. unsigned int *complete,
  227. unsigned int *send_only);
  228. struct ipoib_path_iter *ipoib_path_iter_init(struct net_device *dev);
  229. int ipoib_path_iter_next(struct ipoib_path_iter *iter);
  230. void ipoib_path_iter_read(struct ipoib_path_iter *iter,
  231. struct ipoib_path *path);
  232. #endif
  233. int ipoib_mcast_attach(struct net_device *dev, u16 mlid,
  234. union ib_gid *mgid);
  235. int ipoib_mcast_detach(struct net_device *dev, u16 mlid,
  236. union ib_gid *mgid);
  237. int ipoib_init_qp(struct net_device *dev);
  238. int ipoib_transport_dev_init(struct net_device *dev, struct ib_device *ca);
  239. void ipoib_transport_dev_cleanup(struct net_device *dev);
  240. void ipoib_event(struct ib_event_handler *handler,
  241. struct ib_event *record);
  242. int ipoib_vlan_add(struct net_device *pdev, unsigned short pkey);
  243. int ipoib_vlan_delete(struct net_device *pdev, unsigned short pkey);
  244. void ipoib_pkey_poll(void *dev);
  245. int ipoib_pkey_dev_delay_open(struct net_device *dev);
  246. #ifdef CONFIG_INFINIBAND_IPOIB_DEBUG
  247. void ipoib_create_debug_files(struct net_device *dev);
  248. void ipoib_delete_debug_files(struct net_device *dev);
  249. int ipoib_register_debugfs(void);
  250. void ipoib_unregister_debugfs(void);
  251. #else
  252. static inline void ipoib_create_debug_files(struct net_device *dev) { }
  253. static inline void ipoib_delete_debug_files(struct net_device *dev) { }
  254. static inline int ipoib_register_debugfs(void) { return 0; }
  255. static inline void ipoib_unregister_debugfs(void) { }
  256. #endif
  257. #define ipoib_printk(level, priv, format, arg...) \
  258. printk(level "%s: " format, ((struct ipoib_dev_priv *) priv)->dev->name , ## arg)
  259. #define ipoib_warn(priv, format, arg...) \
  260. ipoib_printk(KERN_WARNING, priv, format , ## arg)
  261. #ifdef CONFIG_INFINIBAND_IPOIB_DEBUG
  262. extern int ipoib_debug_level;
  263. #define ipoib_dbg(priv, format, arg...) \
  264. do { \
  265. if (ipoib_debug_level > 0) \
  266. ipoib_printk(KERN_DEBUG, priv, format , ## arg); \
  267. } while (0)
  268. #define ipoib_dbg_mcast(priv, format, arg...) \
  269. do { \
  270. if (mcast_debug_level > 0) \
  271. ipoib_printk(KERN_DEBUG, priv, format , ## arg); \
  272. } while (0)
  273. #else /* CONFIG_INFINIBAND_IPOIB_DEBUG */
  274. #define ipoib_dbg(priv, format, arg...) \
  275. do { (void) (priv); } while (0)
  276. #define ipoib_dbg_mcast(priv, format, arg...) \
  277. do { (void) (priv); } while (0)
  278. #endif /* CONFIG_INFINIBAND_IPOIB_DEBUG */
  279. #ifdef CONFIG_INFINIBAND_IPOIB_DEBUG_DATA
  280. #define ipoib_dbg_data(priv, format, arg...) \
  281. do { \
  282. if (data_debug_level > 0) \
  283. ipoib_printk(KERN_DEBUG, priv, format , ## arg); \
  284. } while (0)
  285. #else /* CONFIG_INFINIBAND_IPOIB_DEBUG_DATA */
  286. #define ipoib_dbg_data(priv, format, arg...) \
  287. do { (void) (priv); } while (0)
  288. #endif /* CONFIG_INFINIBAND_IPOIB_DEBUG_DATA */
  289. #define IPOIB_GID_FMT "%x:%x:%x:%x:%x:%x:%x:%x"
  290. #define IPOIB_GID_ARG(gid) be16_to_cpup((__be16 *) ((gid).raw + 0)), \
  291. be16_to_cpup((__be16 *) ((gid).raw + 2)), \
  292. be16_to_cpup((__be16 *) ((gid).raw + 4)), \
  293. be16_to_cpup((__be16 *) ((gid).raw + 6)), \
  294. be16_to_cpup((__be16 *) ((gid).raw + 8)), \
  295. be16_to_cpup((__be16 *) ((gid).raw + 10)), \
  296. be16_to_cpup((__be16 *) ((gid).raw + 12)), \
  297. be16_to_cpup((__be16 *) ((gid).raw + 14))
  298. #endif /* _IPOIB_H */