1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35#ifndef _IPOIB_H
36#define _IPOIB_H
37
38#include <linux/list.h>
39#include <linux/skbuff.h>
40#include <linux/netdevice.h>
41#include <linux/workqueue.h>
42#include <linux/kref.h>
43#include <linux/if_infiniband.h>
44#include <linux/mutex.h>
45
46#include <net/neighbour.h>
47
48#include <asm/atomic.h>
49
50#include <rdma/ib_verbs.h>
51#include <rdma/ib_pack.h>
52#include <rdma/ib_sa.h>
53#include <linux/inet_lro.h>
54
55
56
/*
 * Flush levels.  There is one enumerator per flush work item declared in
 * struct ipoib_dev_priv (flush_light, flush_normal, flush_heavy) and per
 * ipoib_ib_dev_flush_*() handler prototype in this header.
 */
enum ipoib_flush_level {
	IPOIB_FLUSH_LIGHT,
	IPOIB_FLUSH_NORMAL,
	IPOIB_FLUSH_HEAVY
};
62
63enum {
64 IPOIB_ENCAP_LEN = 4,
65
66 IPOIB_UD_HEAD_SIZE = IB_GRH_BYTES + IPOIB_ENCAP_LEN,
67 IPOIB_UD_RX_SG = 2,
68
69 IPOIB_CM_MTU = 0x10000 - 0x10,
70 IPOIB_CM_BUF_SIZE = IPOIB_CM_MTU + IPOIB_ENCAP_LEN,
71 IPOIB_CM_HEAD_SIZE = IPOIB_CM_BUF_SIZE % PAGE_SIZE,
72 IPOIB_CM_RX_SG = ALIGN(IPOIB_CM_BUF_SIZE, PAGE_SIZE) / PAGE_SIZE,
73 IPOIB_RX_RING_SIZE = 256,
74 IPOIB_TX_RING_SIZE = 128,
75 IPOIB_MAX_QUEUE_SIZE = 8192,
76 IPOIB_MIN_QUEUE_SIZE = 2,
77 IPOIB_CM_MAX_CONN_QP = 4096,
78
79 IPOIB_NUM_WC = 4,
80
81 IPOIB_MAX_PATH_REC_QUEUE = 3,
82 IPOIB_MAX_MCAST_QUEUE = 3,
83
84 IPOIB_FLAG_OPER_UP = 0,
85 IPOIB_FLAG_INITIALIZED = 1,
86 IPOIB_FLAG_ADMIN_UP = 2,
87 IPOIB_PKEY_ASSIGNED = 3,
88 IPOIB_PKEY_STOP = 4,
89 IPOIB_FLAG_SUBINTERFACE = 5,
90 IPOIB_MCAST_RUN = 6,
91 IPOIB_STOP_REAPER = 7,
92 IPOIB_FLAG_ADMIN_CM = 9,
93 IPOIB_FLAG_UMCAST = 10,
94 IPOIB_FLAG_CSUM = 11,
95
96 IPOIB_MAX_BACKOFF_SECONDS = 16,
97
98 IPOIB_MCAST_FLAG_FOUND = 0,
99 IPOIB_MCAST_FLAG_SENDONLY = 1,
100 IPOIB_MCAST_FLAG_BUSY = 2,
101 IPOIB_MCAST_FLAG_ATTACHED = 3,
102
103 IPOIB_MAX_LRO_DESCRIPTORS = 8,
104 IPOIB_LRO_MAX_AGGR = 64,
105
106 MAX_SEND_CQE = 16,
107 IPOIB_CM_COPYBREAK = 256,
108};
109
/*
 * Operation marker bits: bit 31 for receive and, when connected mode is
 * configured, bit 30 for CM.  Without CONFIG_INFINIBAND_IPOIB_CM the CM
 * marker is 0, so masking with it never matches.
 * NOTE(review): presumably OR-ed into work-request ids - confirm at the users.
 */
#define IPOIB_OP_RECV   (1ul << 31)
#ifdef CONFIG_INFINIBAND_IPOIB_CM
#define IPOIB_OP_CM     (1ul << 30)
#else
#define IPOIB_OP_CM     (0)
#endif
116
117
118
119struct ipoib_header {
120 __be16 proto;
121 u16 reserved;
122};
123
124struct ipoib_pseudoheader {
125 u8 hwaddr[INFINIBAND_ALEN];
126};
127
128
129struct ipoib_mcast {
130 struct ib_sa_mcmember_rec mcmember;
131 struct ib_sa_multicast *mc;
132 struct ipoib_ah *ah;
133
134 struct rb_node rb_node;
135 struct list_head list;
136
137 unsigned long created;
138 unsigned long backoff;
139
140 unsigned long flags;
141 unsigned char logcount;
142
143 struct list_head neigh_list;
144
145 struct sk_buff_head pkt_queue;
146
147 struct net_device *dev;
148};
149
150struct ipoib_rx_buf {
151 struct sk_buff *skb;
152 u64 mapping[IPOIB_UD_RX_SG];
153};
154
155struct ipoib_tx_buf {
156 struct sk_buff *skb;
157 u64 mapping[MAX_SKB_FRAGS + 1];
158};
159
160struct ipoib_cm_tx_buf {
161 struct sk_buff *skb;
162 u64 mapping;
163};
164
165struct ib_cm_id;
166
167struct ipoib_cm_data {
168 __be32 qpn;
169 __be32 mtu;
170};
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
/* State of a connected-mode receive context (stored in ipoib_cm_rx.state). */
enum ipoib_cm_state {
	IPOIB_CM_RX_LIVE,
	IPOIB_CM_RX_ERROR,
	IPOIB_CM_RX_FLUSH
};
204
205struct ipoib_cm_rx {
206 struct ib_cm_id *id;
207 struct ib_qp *qp;
208 struct ipoib_cm_rx_buf *rx_ring;
209 struct list_head list;
210 struct net_device *dev;
211 unsigned long jiffies;
212 enum ipoib_cm_state state;
213 int recv_count;
214};
215
216struct ipoib_cm_tx {
217 struct ib_cm_id *id;
218 struct ib_qp *qp;
219 struct list_head list;
220 struct net_device *dev;
221 struct ipoib_neigh *neigh;
222 struct ipoib_path *path;
223 struct ipoib_cm_tx_buf *tx_ring;
224 unsigned tx_head;
225 unsigned tx_tail;
226 unsigned long flags;
227 u32 mtu;
228};
229
230struct ipoib_cm_rx_buf {
231 struct sk_buff *skb;
232 u64 mapping[IPOIB_CM_RX_SG];
233};
234
235struct ipoib_cm_dev_priv {
236 struct ib_srq *srq;
237 struct ipoib_cm_rx_buf *srq_ring;
238 struct ib_cm_id *id;
239 struct list_head passive_ids;
240 struct list_head rx_error_list;
241 struct list_head rx_flush_list;
242 struct list_head rx_drain_list;
243 struct list_head rx_reap_list;
244 struct work_struct start_task;
245 struct work_struct reap_task;
246 struct work_struct skb_task;
247 struct work_struct rx_reap_task;
248 struct delayed_work stale_task;
249 struct sk_buff_head skb_queue;
250 struct list_head start_list;
251 struct list_head reap_list;
252 struct ib_wc ibwc[IPOIB_NUM_WC];
253 struct ib_sge rx_sge[IPOIB_CM_RX_SG];
254 struct ib_recv_wr rx_wr;
255 int nonsrq_conn_qp;
256 int max_cm_mtu;
257 int num_frags;
258};
259
260struct ipoib_ethtool_st {
261 u16 coalesce_usecs;
262 u16 max_coalesced_frames;
263};
264
265struct ipoib_lro {
266 struct net_lro_mgr lro_mgr;
267 struct net_lro_desc lro_desc[IPOIB_MAX_LRO_DESCRIPTORS];
268};
269
270
271
272
273
274
275struct ipoib_dev_priv {
276 spinlock_t lock;
277
278 struct net_device *dev;
279
280 struct napi_struct napi;
281
282 unsigned long flags;
283
284 struct mutex vlan_mutex;
285
286 struct rb_root path_tree;
287 struct list_head path_list;
288
289 struct ipoib_mcast *broadcast;
290 struct list_head multicast_list;
291 struct rb_root multicast_tree;
292
293 struct delayed_work pkey_poll_task;
294 struct delayed_work mcast_task;
295 struct work_struct carrier_on_task;
296 struct work_struct flush_light;
297 struct work_struct flush_normal;
298 struct work_struct flush_heavy;
299 struct work_struct restart_task;
300 struct delayed_work ah_reap_task;
301
302 struct ib_device *ca;
303 u8 port;
304 u16 pkey;
305 u16 pkey_index;
306 struct ib_pd *pd;
307 struct ib_mr *mr;
308 struct ib_cq *recv_cq;
309 struct ib_cq *send_cq;
310 struct ib_qp *qp;
311 u32 qkey;
312
313 union ib_gid local_gid;
314 u16 local_lid;
315
316 unsigned int admin_mtu;
317 unsigned int mcast_mtu;
318 unsigned int max_ib_mtu;
319
320 struct ipoib_rx_buf *rx_ring;
321
322 struct ipoib_tx_buf *tx_ring;
323 unsigned tx_head;
324 unsigned tx_tail;
325 struct ib_sge tx_sge[MAX_SKB_FRAGS + 1];
326 struct ib_send_wr tx_wr;
327 unsigned tx_outstanding;
328 struct ib_wc send_wc[MAX_SEND_CQE];
329
330 struct ib_recv_wr rx_wr;
331 struct ib_sge rx_sge[IPOIB_UD_RX_SG];
332
333 struct ib_wc ibwc[IPOIB_NUM_WC];
334
335 struct list_head dead_ahs;
336
337 struct ib_event_handler event_handler;
338
339 struct net_device *parent;
340 struct list_head child_intfs;
341 struct list_head list;
342
343#ifdef CONFIG_INFINIBAND_IPOIB_CM
344 struct ipoib_cm_dev_priv cm;
345#endif
346
347#ifdef CONFIG_INFINIBAND_IPOIB_DEBUG
348 struct list_head fs_list;
349 struct dentry *mcg_dentry;
350 struct dentry *path_dentry;
351#endif
352 int hca_caps;
353 struct ipoib_ethtool_st ethtool;
354 struct timer_list poll_timer;
355
356 struct ipoib_lro lro;
357};
358
359struct ipoib_ah {
360 struct net_device *dev;
361 struct ib_ah *ah;
362 struct list_head list;
363 struct kref ref;
364 unsigned last_send;
365};
366
367struct ipoib_path {
368 struct net_device *dev;
369 struct ib_sa_path_rec pathrec;
370 struct ipoib_ah *ah;
371 struct sk_buff_head queue;
372
373 struct list_head neigh_list;
374
375 int query_id;
376 struct ib_sa_query *query;
377 struct completion done;
378
379 struct rb_node rb_node;
380 struct list_head list;
381 int valid;
382};
383
384struct ipoib_neigh {
385 struct ipoib_ah *ah;
386#ifdef CONFIG_INFINIBAND_IPOIB_CM
387 struct ipoib_cm_tx *cm;
388#endif
389 union ib_gid dgid;
390 struct sk_buff_head queue;
391
392 struct neighbour *neighbour;
393 struct net_device *dev;
394
395 struct list_head list;
396};
397
/*
 * Datagram-mode size helpers for a given IB MTU:
 *   IPOIB_UD_MTU      - the IB MTU minus the encapsulation header;
 *   IPOIB_UD_BUF_SIZE - the IB MTU plus the GRH.
 * The argument is parenthesized so that any expression (for example a
 * conditional) can be passed safely.
 */
#define IPOIB_UD_MTU(ib_mtu)		((ib_mtu) - IPOIB_ENCAP_LEN)
#define IPOIB_UD_BUF_SIZE(ib_mtu)	((ib_mtu) + IB_GRH_BYTES)
400
401static inline int ipoib_ud_need_sg(unsigned int ib_mtu)
402{
403 return IPOIB_UD_BUF_SIZE(ib_mtu) > PAGE_SIZE;
404}
405
406
407
408
409
410
411
412static inline struct ipoib_neigh **to_ipoib_neigh(struct neighbour *neigh)
413{
414 return (void*) neigh + ALIGN(offsetof(struct neighbour, ha) +
415 INFINIBAND_ALEN, sizeof(void *));
416}
417
/* Allocation and release of the per-neighbour state (defined elsewhere). */
struct ipoib_neigh *ipoib_neigh_alloc(struct neighbour *neigh,
				      struct net_device *dev);
void ipoib_neigh_free(struct net_device *dev, struct ipoib_neigh *neigh);

/* Workqueue shared by the driver; defined in another translation unit. */
extern struct workqueue_struct *ipoib_workqueue;
423
424
425
/* NAPI poll routine and completion-queue callbacks (defined elsewhere). */
int ipoib_poll(struct napi_struct *napi, int budget);
void ipoib_ib_completion(struct ib_cq *cq, void *dev_ptr);
void ipoib_send_comp_handler(struct ib_cq *cq, void *dev_ptr);
429
430struct ipoib_ah *ipoib_create_ah(struct net_device *dev,
431 struct ib_pd *pd, struct ib_ah_attr *attr);
432void ipoib_free_ah(struct kref *kref);
433static inline void ipoib_put_ah(struct ipoib_ah *ah)
434{
435 kref_put(&ah->ref, ipoib_free_ah);
436}
437
438int ipoib_open(struct net_device *dev);
439int ipoib_add_pkey_attr(struct net_device *dev);
440int ipoib_add_umcast_attr(struct net_device *dev);
441
442void ipoib_send(struct net_device *dev, struct sk_buff *skb,
443 struct ipoib_ah *address, u32 qpn);
444void ipoib_reap_ah(struct work_struct *work);
445
446void ipoib_mark_paths_invalid(struct net_device *dev);
447void ipoib_flush_paths(struct net_device *dev);
448struct ipoib_dev_priv *ipoib_intf_alloc(const char *format);
449
450int ipoib_ib_dev_init(struct net_device *dev, struct ib_device *ca, int port);
451void ipoib_ib_dev_flush_light(struct work_struct *work);
452void ipoib_ib_dev_flush_normal(struct work_struct *work);
453void ipoib_ib_dev_flush_heavy(struct work_struct *work);
454void ipoib_pkey_event(struct work_struct *work);
455void ipoib_ib_dev_cleanup(struct net_device *dev);
456
457int ipoib_ib_dev_open(struct net_device *dev);
458int ipoib_ib_dev_up(struct net_device *dev);
459int ipoib_ib_dev_down(struct net_device *dev, int flush);
460int ipoib_ib_dev_stop(struct net_device *dev, int flush);
461
462int ipoib_dev_init(struct net_device *dev, struct ib_device *ca, int port);
463void ipoib_dev_cleanup(struct net_device *dev);
464
465void ipoib_mcast_join_task(struct work_struct *work);
466void ipoib_mcast_carrier_on_task(struct work_struct *work);
467void ipoib_mcast_send(struct net_device *dev, void *mgid, struct sk_buff *skb);
468
469void ipoib_mcast_restart_task(struct work_struct *work);
470int ipoib_mcast_start_thread(struct net_device *dev);
471int ipoib_mcast_stop_thread(struct net_device *dev, int flush);
472
473void ipoib_mcast_dev_down(struct net_device *dev);
474void ipoib_mcast_dev_flush(struct net_device *dev);
475
#ifdef CONFIG_INFINIBAND_IPOIB_DEBUG
/*
 * Iterators over multicast groups and paths, available only in debug
 * builds.  Each has an init/next/read triple; the iterator types are
 * opaque in this header.
 */
struct ipoib_mcast_iter *ipoib_mcast_iter_init(struct net_device *dev);
int ipoib_mcast_iter_next(struct ipoib_mcast_iter *iter);
void ipoib_mcast_iter_read(struct ipoib_mcast_iter *iter,
			   union ib_gid *gid,
			   unsigned long *created,
			   unsigned int *queuelen,
			   unsigned int *complete,
			   unsigned int *send_only);

struct ipoib_path_iter *ipoib_path_iter_init(struct net_device *dev);
int ipoib_path_iter_next(struct ipoib_path_iter *iter);
void ipoib_path_iter_read(struct ipoib_path_iter *iter,
			  struct ipoib_path *path);
#endif
491
492int ipoib_mcast_attach(struct net_device *dev, u16 mlid,
493 union ib_gid *mgid, int set_qkey);
494
495int ipoib_init_qp(struct net_device *dev);
496int ipoib_transport_dev_init(struct net_device *dev, struct ib_device *ca);
497void ipoib_transport_dev_cleanup(struct net_device *dev);
498
499void ipoib_event(struct ib_event_handler *handler,
500 struct ib_event *record);
501
502int ipoib_vlan_add(struct net_device *pdev, unsigned short pkey);
503int ipoib_vlan_delete(struct net_device *pdev, unsigned short pkey);
504
505void ipoib_pkey_poll(struct work_struct *work);
506int ipoib_pkey_dev_delay_open(struct net_device *dev);
507void ipoib_drain_cq(struct net_device *dev);
508
509void ipoib_set_ethtool_ops(struct net_device *dev);
510int ipoib_set_dev_features(struct ipoib_dev_priv *priv, struct ib_device *hca);
511
512#ifdef CONFIG_INFINIBAND_IPOIB_CM
513
/*
 * Flag bits carried in the first byte of a hardware address.
 * IPOIB_FLAGS_UC is defined but not used in this header.
 */
#define IPOIB_FLAGS_RC		0x80
#define IPOIB_FLAGS_UC		0x40

/*
 * Non-zero when the RC flag is set in byte 0 of hardware address @ha.
 * @ha is parenthesized so that pointer expressions such as `addr + n`
 * index the intended byte.
 */
#define IPOIB_CM_SUPPORTED(ha)	((ha)[0] & (IPOIB_FLAGS_RC))

/* Defined in another translation unit. */
extern int ipoib_max_conn_qp;
521
522static inline int ipoib_cm_admin_enabled(struct net_device *dev)
523{
524 struct ipoib_dev_priv *priv = netdev_priv(dev);
525 return IPOIB_CM_SUPPORTED(dev->dev_addr) &&
526 test_bit(IPOIB_FLAG_ADMIN_CM, &priv->flags);
527}
528
529static inline int ipoib_cm_enabled(struct net_device *dev, struct neighbour *n)
530{
531 struct ipoib_dev_priv *priv = netdev_priv(dev);
532 return IPOIB_CM_SUPPORTED(n->ha) &&
533 test_bit(IPOIB_FLAG_ADMIN_CM, &priv->flags);
534}
535
536static inline int ipoib_cm_up(struct ipoib_neigh *neigh)
537
538{
539 return test_bit(IPOIB_FLAG_OPER_UP, &neigh->cm->flags);
540}
541
542static inline struct ipoib_cm_tx *ipoib_cm_get(struct ipoib_neigh *neigh)
543{
544 return neigh->cm;
545}
546
547static inline void ipoib_cm_set(struct ipoib_neigh *neigh, struct ipoib_cm_tx *tx)
548{
549 neigh->cm = tx;
550}
551
552static inline int ipoib_cm_has_srq(struct net_device *dev)
553{
554 struct ipoib_dev_priv *priv = netdev_priv(dev);
555 return !!priv->cm.srq;
556}
557
558static inline unsigned int ipoib_cm_max_mtu(struct net_device *dev)
559{
560 struct ipoib_dev_priv *priv = netdev_priv(dev);
561 return priv->cm.max_cm_mtu;
562}
563
/*
 * Connected-mode entry points implemented elsewhere.  The #else branch of
 * this conditional provides inline stubs with the same names for builds
 * without CONFIG_INFINIBAND_IPOIB_CM.
 */
void ipoib_cm_send(struct net_device *dev, struct sk_buff *skb,
		   struct ipoib_cm_tx *tx);
int ipoib_cm_dev_open(struct net_device *dev);
void ipoib_cm_dev_stop(struct net_device *dev);
int ipoib_cm_dev_init(struct net_device *dev);
int ipoib_cm_add_mode_attr(struct net_device *dev);
void ipoib_cm_dev_cleanup(struct net_device *dev);
struct ipoib_cm_tx *ipoib_cm_create_tx(struct net_device *dev,
				       struct ipoib_path *path,
				       struct ipoib_neigh *neigh);
void ipoib_cm_destroy_tx(struct ipoib_cm_tx *tx);
void ipoib_cm_skb_too_long(struct net_device *dev, struct sk_buff *skb,
			   unsigned int mtu);
void ipoib_cm_handle_rx_wc(struct net_device *dev, struct ib_wc *wc);
void ipoib_cm_handle_tx_wc(struct net_device *dev, struct ib_wc *wc);
577#else
578
/*
 * Connected mode compiled out: the query helpers below keep their names and
 * signatures but always report "not available" (0 or NULL), and
 * ipoib_cm_set() does nothing.
 */
struct ipoib_cm_tx;

#define ipoib_max_conn_qp 0

static inline int ipoib_cm_admin_enabled(struct net_device *dev)
{
	return 0;
}

static inline int ipoib_cm_enabled(struct net_device *dev, struct neighbour *n)
{
	return 0;
}

static inline int ipoib_cm_up(struct ipoib_neigh *neigh)
{
	return 0;
}

static inline struct ipoib_cm_tx *ipoib_cm_get(struct ipoib_neigh *neigh)
{
	return NULL;
}

static inline void ipoib_cm_set(struct ipoib_neigh *neigh, struct ipoib_cm_tx *tx)
{
}

static inline int ipoib_cm_has_srq(struct net_device *dev)
{
	return 0;
}

static inline unsigned int ipoib_cm_max_mtu(struct net_device *dev)
{
	return 0;
}
617
/*
 * Connected mode compiled out: lifecycle stubs.  The void functions do
 * nothing.  ipoib_cm_dev_open() and ipoib_cm_add_mode_attr() return 0,
 * ipoib_cm_dev_init() returns -ENOSYS, and ipoib_cm_create_tx() returns
 * NULL.
 */
static inline
void ipoib_cm_send(struct net_device *dev, struct sk_buff *skb, struct ipoib_cm_tx *tx)
{
}

static inline
int ipoib_cm_dev_open(struct net_device *dev)
{
	return 0;
}

static inline
void ipoib_cm_dev_stop(struct net_device *dev)
{
}

static inline
int ipoib_cm_dev_init(struct net_device *dev)
{
	return -ENOSYS;
}

static inline
void ipoib_cm_dev_cleanup(struct net_device *dev)
{
}

static inline
struct ipoib_cm_tx *ipoib_cm_create_tx(struct net_device *dev, struct ipoib_path *path,
				       struct ipoib_neigh *neigh)
{
	return NULL;
}

static inline
void ipoib_cm_destroy_tx(struct ipoib_cm_tx *tx)
{
}

static inline
int ipoib_cm_add_mode_attr(struct net_device *dev)
{
	return 0;
}
666
/*
 * Connected mode compiled out: the oversized-skb hook just frees @skb with
 * dev_kfree_skb_any(); @dev and @mtu are unused.
 */
static inline void ipoib_cm_skb_too_long(struct net_device *dev, struct sk_buff *skb,
					 unsigned int mtu)
{
	dev_kfree_skb_any(skb);
}

/* Connected mode compiled out: completion handlers are no-ops. */
static inline void ipoib_cm_handle_rx_wc(struct net_device *dev, struct ib_wc *wc)
{
}

static inline void ipoib_cm_handle_tx_wc(struct net_device *dev, struct ib_wc *wc)
{
}
680#endif
681
/*
 * debugfs hooks.  With CONFIG_INFINIBAND_IPOIB_DEBUG they are real functions
 * defined elsewhere; without it they are empty inline stubs and
 * ipoib_register_debugfs() reports success (0).
 */
#ifdef CONFIG_INFINIBAND_IPOIB_DEBUG
void ipoib_create_debug_files(struct net_device *dev);
void ipoib_delete_debug_files(struct net_device *dev);
int ipoib_register_debugfs(void);
void ipoib_unregister_debugfs(void);
#else
static inline void ipoib_create_debug_files(struct net_device *dev) { }
static inline void ipoib_delete_debug_files(struct net_device *dev) { }
static inline int ipoib_register_debugfs(void) { return 0; }
static inline void ipoib_unregister_debugfs(void) { }
#endif
693
/*
 * printk() wrappers that prefix every message with the interface name.
 * @priv is cast to struct ipoib_dev_priv * and its dev->name is printed
 * before @format.  @priv is parenthesized so the cast applies to the whole
 * argument expression, not just its first operand.
 */
#define ipoib_printk(level, priv, format, arg...)	\
	printk(level "%s: " format, ((struct ipoib_dev_priv *) (priv))->dev->name , ## arg)
#define ipoib_warn(priv, format, arg...)		\
	ipoib_printk(KERN_WARNING, priv, format , ## arg)
698
/* Queue-size variables and the SA client; all defined in other files. */
extern int ipoib_sendq_size;
extern int ipoib_recvq_size;

extern struct ib_sa_client ipoib_sa_client;
703
/*
 * Debug logging.  With CONFIG_INFINIBAND_IPOIB_DEBUG the macros print at
 * KERN_DEBUG when the matching level variable is greater than zero.
 * Without it they only evaluate (void)(priv); the format and its arguments
 * are discarded unevaluated.
 *
 * ipoib_dbg_mcast() reads mcast_debug_level, which this header does not
 * declare; the including file has to provide it.
 */
#ifdef CONFIG_INFINIBAND_IPOIB_DEBUG
extern int ipoib_debug_level;

#define ipoib_dbg(priv, format, arg...)			\
	do {						\
		if (ipoib_debug_level > 0)		\
			ipoib_printk(KERN_DEBUG, priv, format , ## arg); \
	} while (0)
#define ipoib_dbg_mcast(priv, format, arg...)		\
	do {						\
		if (mcast_debug_level > 0)		\
			ipoib_printk(KERN_DEBUG, priv, format , ## arg); \
	} while (0)
#else
#define ipoib_dbg(priv, format, arg...)			\
	do { (void) (priv); } while (0)
#define ipoib_dbg_mcast(priv, format, arg...)		\
	do { (void) (priv); } while (0)
#endif
723
/*
 * Data-path debug logging, enabled by CONFIG_INFINIBAND_IPOIB_DEBUG_DATA.
 * When enabled it prints at KERN_DEBUG if data_debug_level is greater than
 * zero; that variable is not declared in this header, so the including file
 * has to provide it.  When disabled only (void)(priv) is evaluated.
 */
#ifdef CONFIG_INFINIBAND_IPOIB_DEBUG_DATA
#define ipoib_dbg_data(priv, format, arg...)		\
	do {						\
		if (data_debug_level > 0)		\
			ipoib_printk(KERN_DEBUG, priv, format , ## arg); \
	} while (0)
#else
#define ipoib_dbg_data(priv, format, arg...)		\
	do { (void) (priv); } while (0)
#endif
734
/*
 * Read the first four bytes of hardware address @ha as a big-endian 32-bit
 * value and keep the low 24 bits.  @ha is parenthesized so the cast applies
 * to the whole argument: IPOIB_QPN(p + n) reads at byte offset n of p
 * rather than n 32-bit words further on.
 */
#define IPOIB_QPN(ha) (be32_to_cpup((__be32 *) (ha)) & 0xffffff)
736
737#endif
738