2 * Copyright (c) 2006, 2007 Cisco Systems. All rights reserved.
3 * Copyright (c) 2007, 2008 Mellanox Technologies. All rights reserved.
5 * This software is available to you under a choice of one of two
6 * licenses. You may choose to be licensed under the terms of the GNU
7 * General Public License (GPL) Version 2, available from the file
8 * COPYING in the main directory of this source tree, or the
9 * OpenIB.org BSD license below:
11 * Redistribution and use in source and binary forms, with or
12 * without modification, are permitted provided that the following
15 * - Redistributions of source code must retain the above
16 * copyright notice, this list of conditions and the following
19 * - Redistributions in binary form must reproduce the above
20 * copyright notice, this list of conditions and the following
21 * disclaimer in the documentation and/or other materials
22 * provided with the distribution.
24 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
25 * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
26 * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
27 * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS
28 * BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN
29 * ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN
30 * CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
37 #include <linux/compiler.h>
38 #include <linux/list.h>
39 #include <linux/mutex.h>
41 #include <rdma/ib_verbs.h>
42 #include <rdma/ib_umem.h>
44 #include <linux/mlx4/device.h>
45 #include <linux/mlx4/doorbell.h>
/* Driver name string; pasted into the log prefixes built by the macros below. */
47 #define MLX4_IB_DRV_NAME "mlx4_ib"
/*
 * pr_fmt() override: builds "<mlx4_ib> %s: " followed by the caller's format
 * and supplies __func__ as the argument for that leading %s.
 */
52 #define pr_fmt(fmt) "<" MLX4_IB_DRV_NAME "> %s: " fmt, __func__
/*
 * Emit a warning through dev_warn() against (ibdev)->dma_device, with
 * "mlx4_ib: " prepended to the message.  format must be a string literal
 * because it is concatenated with the prefix.  The named variadic parameter
 * (arg...) and "## arg" are GNU extensions; "## arg" drops the preceding
 * comma when no extra arguments are passed.
 */
54 #define mlx4_ib_warn(ibdev, format, arg...) \
55 dev_warn((ibdev)->dma_device, MLX4_IB_DRV_NAME ": " format, ## arg)
/* Constants consumed by the MLX4_IB_SQ_HEADROOM / MLX4_IB_SQ_MAX_SPARE macros. */
58 MLX4_IB_SQ_MIN_WQE_SHIFT = 6,
59 MLX4_IB_MAX_HEADROOM = 2048
/*
 * (MLX4_IB_MAX_HEADROOM >> shift) + 1.
 * presumably shift is log2 of the send WQE size in bytes -- confirm with callers.
 */
62 #define MLX4_IB_SQ_HEADROOM(shift) ((MLX4_IB_MAX_HEADROOM >> (shift)) + 1)
/* The headroom at the minimum WQE shift: (2048 >> 6) + 1 = 33. */
63 #define MLX4_IB_SQ_MAX_SPARE (MLX4_IB_SQ_HEADROOM(MLX4_IB_SQ_MIN_WQE_SHIFT))
/*
 * Driver-private user context.  Embeds the core ib_ucontext as "ibucontext",
 * which is the member to_mucontext() uses with container_of() to get back to
 * this structure.
 */
65 struct mlx4_ib_ucontext {
66 struct ib_ucontext ibucontext;
/* presumably db_page_mutex guards db_page_list -- confirm in the doorbell mapping code */
68 struct list_head db_page_list;
69 struct mutex db_page_mutex;
78 struct ib_xrcd ibxrcd;
84 struct mlx4_ib_cq_buf {
/* Resize state for a CQ (per the name); it carries its own mlx4_ib_cq_buf by value. */
89 struct mlx4_ib_cq_resize {
90 struct mlx4_ib_cq_buf buf;
97 struct mlx4_ib_cq_buf buf;
98 struct mlx4_ib_cq_resize *resize_buf;
101 struct mutex resize_mutex;
102 struct ib_umem *umem;
103 struct ib_umem *resize_umem;
109 struct ib_umem *umem;
/*
 * Driver wrapper around the core ib_fast_reg_page_list.  to_mfrpl() maps the
 * embedded "ibfrpl" member back to this structure.
 */
112 struct mlx4_ib_fast_reg_page_list {
113 struct ib_fast_reg_page_list ibfrpl;
/* Array of big-endian 64-bit values; presumably the device-format copy of the page list -- confirm. */
114 __be64 *mapped_page_list;
120 struct mlx4_fmr mfmr;
/*
 * Driver QP flag bits.  The first two take their values from the core
 * IB_QP_CREATE_* flags; the two SRIOV flags occupy bits 30 and 31.
 */
135 enum mlx4_ib_qp_flags {
136 MLX4_IB_QP_LSO = IB_QP_CREATE_IPOIB_UD_LSO,
137 MLX4_IB_QP_BLOCK_MULTICAST_LOOPBACK = IB_QP_CREATE_BLOCK_MULTICAST_LOOPBACK,
138 MLX4_IB_SRIOV_TUNNEL_QP = 1 << 30,
/*
 * NOTE(review): 1 << 31 is not representable in a signed int, so ISO C leaves
 * this shift undefined.  Consider 1U << 31 -- confirm first that every user of
 * these flags tolerates the resulting unsigned value.
 */
139 MLX4_IB_SRIOV_SQP = 1 << 31,
/*
 * List-linked record: "list" chains entries on a list_head based list.
 * The payload members are not visible in this listing.
 */
142 struct mlx4_ib_gid_entry {
143 struct list_head list;
/*
 * Driver QP types.  The first group mirrors the core IB_QPT_* enumerators
 * value for value.  The PROXY and TUN types are distinct single bits
 * (bits 16 to 21), which is what lets MLX4_IB_QPT_ANY_SRIOV OR them into a mask.
 */
149 enum mlx4_ib_qp_type {
151 * IB_QPT_SMI and IB_QPT_GSI have to be the first two entries
152 * here (and in that order) since the MAD layer uses them as
153 * indices into a 2-entry table.
155 MLX4_IB_QPT_SMI = IB_QPT_SMI,
156 MLX4_IB_QPT_GSI = IB_QPT_GSI,
158 MLX4_IB_QPT_RC = IB_QPT_RC,
159 MLX4_IB_QPT_UC = IB_QPT_UC,
160 MLX4_IB_QPT_UD = IB_QPT_UD,
161 MLX4_IB_QPT_RAW_IPV6 = IB_QPT_RAW_IPV6,
162 MLX4_IB_QPT_RAW_ETHERTYPE = IB_QPT_RAW_ETHERTYPE,
163 MLX4_IB_QPT_RAW_PACKET = IB_QPT_RAW_PACKET,
164 MLX4_IB_QPT_XRC_INI = IB_QPT_XRC_INI,
165 MLX4_IB_QPT_XRC_TGT = IB_QPT_XRC_TGT,
/* Driver-only types from here on: one bit each, so they can be tested with a mask. */
167 MLX4_IB_QPT_PROXY_SMI_OWNER = 1 << 16,
168 MLX4_IB_QPT_PROXY_SMI = 1 << 17,
169 MLX4_IB_QPT_PROXY_GSI = 1 << 18,
170 MLX4_IB_QPT_TUN_SMI_OWNER = 1 << 19,
171 MLX4_IB_QPT_TUN_SMI = 1 << 20,
172 MLX4_IB_QPT_TUN_GSI = 1 << 21,
/*
 * Mask of all six PROXY and TUN QP type bits from enum mlx4_ib_qp_type
 * (bits 16 to 21); AND a QP type with it to test for any of them.
 */
175 #define MLX4_IB_QPT_ANY_SRIOV (MLX4_IB_QPT_PROXY_SMI_OWNER | \
176 MLX4_IB_QPT_PROXY_SMI | MLX4_IB_QPT_PROXY_GSI | MLX4_IB_QPT_TUN_SMI_OWNER | \
177 MLX4_IB_QPT_TUN_SMI | MLX4_IB_QPT_TUN_GSI)
/*
 * Bit flags; presumably the values passed as the mad_ifc_flags argument of
 * mlx4_MAD_IFC() -- confirm.  IGNORE_KEYS is the OR of the MKEY and BKEY
 * bits (value 3); NET_VIEW is an independent bit (value 4).
 */
179 enum mlx4_ib_mad_ifc_flags {
180 MLX4_MAD_IFC_IGNORE_MKEY = 1,
181 MLX4_MAD_IFC_IGNORE_BKEY = 2,
182 MLX4_MAD_IFC_IGNORE_KEYS = (MLX4_MAD_IFC_IGNORE_MKEY |
183 MLX4_MAD_IFC_IGNORE_BKEY),
184 MLX4_MAD_IFC_NET_VIEW = 4,
188 MLX4_NUM_TUNNEL_BUFS = 256,
191 struct mlx4_ib_tunnel_header {
/*
 * Tunnel header as seen on receive (per the name).  The multi-byte fields
 * shown are stored big-endian (__be32 / __be16).
 */
206 struct mlx4_rcv_tunnel_hdr {
207 __be32 flags_src_qp; /* flags[6:5] is defined for VLANs:
208 * 0x0 - no vlan was in the packet
209 * 0x01 - C-VLAN was in the packet */
210 u8 g_ml_path; /* gid bit stands for ipv6/4 header in RoCE */
/* presumably holds either the SLID or MAC bits 47:32, as the name suggests -- confirm */
214 __be16 slid_mac_47_32;
/*
 * Header used with proxy special QPs (per the name); embeds an
 * mlx4_rcv_tunnel_hdr as "tun".  Other members are not visible in this listing.
 */
218 struct mlx4_ib_proxy_sqp_hdr {
220 struct mlx4_rcv_tunnel_hdr tun;
229 struct mlx4_ib_wq rq;
232 __be32 sq_signal_bits;
233 unsigned sq_next_wqe;
234 int sq_max_wqes_per_wr;
236 struct mlx4_ib_wq sq;
238 enum mlx4_ib_qp_type mlx4_ib_qp_type;
239 struct ib_umem *umem;
252 struct list_head gid_list;
253 struct list_head steering_rules;
254 struct mlx4_ib_buf *sqp_proxy_rcv;
260 struct mlx4_srq msrq;
268 struct ib_umem *umem;
275 union mlx4_ext_av av;
/* Deferred-work item: a work_struct together with the mlx4_ib_dev it refers to. */
278 struct mlx4_ib_demux_work {
279 struct work_struct work;
280 struct mlx4_ib_dev *dev;
/* Tunnel transmit buffer (per the name): wraps an mlx4_ib_buf by value. */
287 struct mlx4_ib_tun_tx_buf {
288 struct mlx4_ib_buf buf;
/*
 * Per-QP state held by a mlx4_ib_demux_pv_ctx (which stores two of these).
 * presumably "ring" is the receive side and "tx_ring" the send side -- confirm.
 */
292 struct mlx4_ib_demux_pv_qp {
294 enum ib_qp_type proxy_qpt;
295 struct mlx4_ib_buf *ring;
296 struct mlx4_ib_tun_tx_buf *tx_ring;
/*
 * States stored in mlx4_ib_demux_pv_ctx.state.
 * NOTE(review): the first enumerator (original line 303) is absent from this
 * listing, so the numeric values cannot be read off from the lines below.
 */
302 enum mlx4_ib_demux_pv_state {
304 DEMUX_PV_STATE_STARTING,
305 DEMUX_PV_STATE_ACTIVE,
306 DEMUX_PV_STATE_DOWNING,
/*
 * Demux "pv" context: its current state, the ib_device it belongs to, a work
 * item with the workqueue pointer kept beside it, and two per-QP slots.
 */
309 struct mlx4_ib_demux_pv_ctx {
312 enum mlx4_ib_demux_pv_state state;
314 struct ib_device *ib_dev;
318 struct work_struct work;
319 struct workqueue_struct *wq;
/* presumably one slot each for the SMI and GSI QPs -- confirm the indexing */
320 struct mlx4_ib_demux_pv_qp qp[2];
/*
 * Demux context; struct mlx4_ib_sriov holds one per port in its demux[] array.
 * Carries the ib_device, two workqueue pointers, a big-endian subnet prefix
 * and GUID cache, and a back-pointer to the owning mlx4_ib_dev.
 */
323 struct mlx4_ib_demux_ctx {
324 struct ib_device *ib_dev;
326 struct workqueue_struct *wq;
327 struct workqueue_struct *ud_wq;
329 __be64 subnet_prefix;
/* 128 big-endian GUIDs; what the index represents is not visible here. */
330 __be64 guid_cache[128];
331 struct mlx4_ib_dev *dev;
/* presumably an array of per-slave tunnel context pointers -- confirm */
332 struct mlx4_ib_demux_pv_ctx **tun;
/*
 * SR-IOV state: one demux context and one "sqps" context pointer per port
 * (both arrays are sized by MLX4_MAX_PORTS), plus the going-down spinlock.
 */
335 struct mlx4_ib_sriov {
336 struct mlx4_ib_demux_ctx demux[MLX4_MAX_PORTS];
337 struct mlx4_ib_demux_pv_ctx *sqps[MLX4_MAX_PORTS];
338 /* Take this spinlock with the "irq" lock variants, because
339 * it may be acquired from interrupt context. */
340 spinlock_t going_down_lock;
/*
 * Ethernet-side ("iboe") state: a net_device pointer per port, a notifier
 * block, and a GID table of 128 entries for each port.
 */
344 struct mlx4_ib_iboe {
346 struct net_device *netdevs[MLX4_MAX_PORTS];
347 struct notifier_block nb;
348 union ib_gid gid_table[MLX4_MAX_PORTS][128];
352 u8 virt2phys_pkey[MLX4_MFUNC_MAX][MLX4_MAX_PORTS][MLX4_MAX_PORT_PKEYS];
353 u16 phys_pkey_cache[MLX4_MAX_PORTS][MLX4_MAX_PORT_PKEYS];
354 struct list_head pkey_port_list[MLX4_MFUNC_MAX];
355 struct kobject *device_parent[MLX4_MFUNC_MAX];
359 struct ib_device ib_dev;
360 struct mlx4_dev *dev;
362 void __iomem *uar_map;
364 struct mlx4_uar priv_uar;
366 MLX4_DECLARE_DOORBELL_LOCK(uar_lock);
368 struct ib_mad_agent *send_agent[MLX4_MAX_PORTS][2];
369 struct ib_ah *sm_ah[MLX4_MAX_PORTS];
371 struct mlx4_ib_sriov sriov;
373 struct mutex cap_mask_mutex;
375 struct mlx4_ib_iboe iboe;
376 int counters[MLX4_MAX_PORTS];
379 struct pkey_mgt pkeys;
/*
 * Work item for handling an event later: carries the target mlx4_ib_dev and
 * holds the mlx4_eqe by value rather than by pointer.
 */
382 struct ib_event_work {
383 struct work_struct work;
384 struct mlx4_ib_dev *ib_dev;
385 struct mlx4_eqe ib_eqe;
/*
 * Core ib_qp_init_attr extended with the proxy QP type, for tunnel QPs (per
 * the name).  Other members are not visible in this listing.
 */
388 struct mlx4_ib_qp_tunnel_init_attr {
389 struct ib_qp_init_attr init_attr;
391 enum ib_qp_type proxy_qp_type;
/*
 * Map a core ib_device to the mlx4_ib_dev that embeds it as member "ib_dev".
 * Pure pointer arithmetic via container_of(): ibdev must really be that
 * member of an mlx4_ib_dev; nothing is checked.
 */
395 static inline struct mlx4_ib_dev *to_mdev(struct ib_device *ibdev)
397 return container_of(ibdev, struct mlx4_ib_dev, ib_dev);
/* Map a core ib_ucontext to the mlx4_ib_ucontext that embeds it as member "ibucontext". */
400 static inline struct mlx4_ib_ucontext *to_mucontext(struct ib_ucontext *ibucontext)
402 return container_of(ibucontext, struct mlx4_ib_ucontext, ibucontext);
/* Map a core ib_pd to the mlx4_ib_pd that embeds it as member "ibpd". */
405 static inline struct mlx4_ib_pd *to_mpd(struct ib_pd *ibpd)
407 return container_of(ibpd, struct mlx4_ib_pd, ibpd);
/* Map a core ib_xrcd to the mlx4_ib_xrcd that embeds it as member "ibxrcd". */
410 static inline struct mlx4_ib_xrcd *to_mxrcd(struct ib_xrcd *ibxrcd)
412 return container_of(ibxrcd, struct mlx4_ib_xrcd, ibxrcd);
/* Map a core ib_cq to the mlx4_ib_cq that embeds it as member "ibcq". */
415 static inline struct mlx4_ib_cq *to_mcq(struct ib_cq *ibcq)
417 return container_of(ibcq, struct mlx4_ib_cq, ibcq);
/*
 * Map a low-level mlx4_cq to the mlx4_ib_cq that embeds it as member "mcq".
 * Counterpart of to_mcq(), which starts from the core ib_cq instead.
 */
420 static inline struct mlx4_ib_cq *to_mibcq(struct mlx4_cq *mcq)
422 return container_of(mcq, struct mlx4_ib_cq, mcq);
/* Map a core ib_mr to the mlx4_ib_mr that embeds it as member "ibmr". */
425 static inline struct mlx4_ib_mr *to_mmr(struct ib_mr *ibmr)
427 return container_of(ibmr, struct mlx4_ib_mr, ibmr);
/*
 * Map a core ib_fast_reg_page_list to the mlx4_ib_fast_reg_page_list that
 * embeds it as member "ibfrpl".
 */
430 static inline struct mlx4_ib_fast_reg_page_list *to_mfrpl(struct ib_fast_reg_page_list *ibfrpl)
432 return container_of(ibfrpl, struct mlx4_ib_fast_reg_page_list, ibfrpl);
/* Map a core ib_fmr to the mlx4_ib_fmr that embeds it as member "ibfmr". */
435 static inline struct mlx4_ib_fmr *to_mfmr(struct ib_fmr *ibfmr)
437 return container_of(ibfmr, struct mlx4_ib_fmr, ibfmr);
/* Map a core ib_qp to the mlx4_ib_qp that embeds it as member "ibqp". */
439 static inline struct mlx4_ib_qp *to_mqp(struct ib_qp *ibqp)
441 return container_of(ibqp, struct mlx4_ib_qp, ibqp);
/*
 * Map a low-level mlx4_qp to the mlx4_ib_qp that embeds it as member "mqp".
 * Counterpart of to_mqp(), which starts from the core ib_qp instead.
 */
444 static inline struct mlx4_ib_qp *to_mibqp(struct mlx4_qp *mqp)
446 return container_of(mqp, struct mlx4_ib_qp, mqp);
/* Map a core ib_srq to the mlx4_ib_srq that embeds it as member "ibsrq". */
449 static inline struct mlx4_ib_srq *to_msrq(struct ib_srq *ibsrq)
451 return container_of(ibsrq, struct mlx4_ib_srq, ibsrq);
/*
 * Map a low-level mlx4_srq to the mlx4_ib_srq that embeds it as member "msrq".
 * Counterpart of to_msrq(), which starts from the core ib_srq instead.
 */
454 static inline struct mlx4_ib_srq *to_mibsrq(struct mlx4_srq *msrq)
456 return container_of(msrq, struct mlx4_ib_srq, msrq);
/* Map a core ib_ah to the mlx4_ib_ah that embeds it as member "ibah". */
459 static inline struct mlx4_ib_ah *to_mah(struct ib_ah *ibah)
461 return container_of(ibah, struct mlx4_ib_ah, ibah);
/*
 * SR-IOV setup and teardown for one device; only declared in this header.
 * presumably init returns 0 on success and a negative errno otherwise -- confirm.
 */
464 int mlx4_ib_init_sriov(struct mlx4_ib_dev *dev);
465 void mlx4_ib_close_sriov(struct mlx4_ib_dev *dev);
/*
 * Map / unmap a user doorbell record for a user context.
 * NOTE(review): the mlx4_ib_db_map_user() prototype is cut off in this
 * listing -- its continuation (original line 468) is missing.
 */
467 int mlx4_ib_db_map_user(struct mlx4_ib_ucontext *context, unsigned long virt,
469 void mlx4_ib_db_unmap_user(struct mlx4_ib_ucontext *context, struct mlx4_db *db);
/*
 * Memory-region and fast-register page-list entry points; only declared in
 * this header.
 * NOTE(review): the mlx4_ib_alloc_fast_reg_page_list() prototype is cut off
 * in this listing -- its continuation (original line 481) is missing.
 */
471 struct ib_mr *mlx4_ib_get_dma_mr(struct ib_pd *pd, int acc);
472 int mlx4_ib_umem_write_mtt(struct mlx4_ib_dev *dev, struct mlx4_mtt *mtt,
473 struct ib_umem *umem);
474 struct ib_mr *mlx4_ib_reg_user_mr(struct ib_pd *pd, u64 start, u64 length,
475 u64 virt_addr, int access_flags,
476 struct ib_udata *udata);
477 int mlx4_ib_dereg_mr(struct ib_mr *mr);
478 struct ib_mr *mlx4_ib_alloc_fast_reg_mr(struct ib_pd *pd,
479 int max_page_list_len);
480 struct ib_fast_reg_page_list *mlx4_ib_alloc_fast_reg_page_list(struct ib_device *ibdev,
482 void mlx4_ib_free_fast_reg_page_list(struct ib_fast_reg_page_list *page_list);
/*
 * Completion-queue entry points; only declared in this header.
 * The two *_cq_clean() variants take identical arguments.
 * presumably the "__" one expects the caller to already hold the CQ lock -- confirm.
 */
484 int mlx4_ib_modify_cq(struct ib_cq *cq, u16 cq_count, u16 cq_period);
485 int mlx4_ib_resize_cq(struct ib_cq *ibcq, int entries, struct ib_udata *udata);
486 struct ib_cq *mlx4_ib_create_cq(struct ib_device *ibdev, int entries, int vector,
487 struct ib_ucontext *context,
488 struct ib_udata *udata);
489 int mlx4_ib_destroy_cq(struct ib_cq *cq);
490 int mlx4_ib_poll_cq(struct ib_cq *ibcq, int num_entries, struct ib_wc *wc);
491 int mlx4_ib_arm_cq(struct ib_cq *cq, enum ib_cq_notify_flags flags);
492 void __mlx4_ib_cq_clean(struct mlx4_ib_cq *cq, u32 qpn, struct mlx4_ib_srq *srq);
493 void mlx4_ib_cq_clean(struct mlx4_ib_cq *cq, u32 qpn, struct mlx4_ib_srq *srq);
/* Address-handle create / query / destroy entry points; only declared in this header. */
495 struct ib_ah *mlx4_ib_create_ah(struct ib_pd *pd, struct ib_ah_attr *ah_attr);
496 int mlx4_ib_query_ah(struct ib_ah *ibah, struct ib_ah_attr *ah_attr);
497 int mlx4_ib_destroy_ah(struct ib_ah *ah);
/*
 * Shared-receive-queue entry points; only declared in this header.
 * mlx4_ib_post_srq_recv() takes a bad_wr out-parameter.
 * presumably it is set to the first work request that failed -- confirm.
 */
499 struct ib_srq *mlx4_ib_create_srq(struct ib_pd *pd,
500 struct ib_srq_init_attr *init_attr,
501 struct ib_udata *udata);
502 int mlx4_ib_modify_srq(struct ib_srq *ibsrq, struct ib_srq_attr *attr,
503 enum ib_srq_attr_mask attr_mask, struct ib_udata *udata);
504 int mlx4_ib_query_srq(struct ib_srq *srq, struct ib_srq_attr *srq_attr);
505 int mlx4_ib_destroy_srq(struct ib_srq *srq);
506 void mlx4_ib_free_srq_wqe(struct mlx4_ib_srq *srq, int wqe_index);
507 int mlx4_ib_post_srq_recv(struct ib_srq *ibsrq, struct ib_recv_wr *wr,
508 struct ib_recv_wr **bad_wr);
/*
 * Queue-pair entry points; only declared in this header.
 * The post_send / post_recv calls take a bad_wr out-parameter.
 * presumably it is set to the first work request that failed -- confirm.
 */
510 struct ib_qp *mlx4_ib_create_qp(struct ib_pd *pd,
511 struct ib_qp_init_attr *init_attr,
512 struct ib_udata *udata);
513 int mlx4_ib_destroy_qp(struct ib_qp *qp);
514 int mlx4_ib_modify_qp(struct ib_qp *ibqp, struct ib_qp_attr *attr,
515 int attr_mask, struct ib_udata *udata);
516 int mlx4_ib_query_qp(struct ib_qp *ibqp, struct ib_qp_attr *qp_attr, int qp_attr_mask,
517 struct ib_qp_init_attr *qp_init_attr);
518 int mlx4_ib_post_send(struct ib_qp *ibqp, struct ib_send_wr *wr,
519 struct ib_send_wr **bad_wr);
520 int mlx4_ib_post_recv(struct ib_qp *ibqp, struct ib_recv_wr *wr,
521 struct ib_recv_wr **bad_wr);
/*
 * MAD handling entry points; only declared in this header.
 * presumably mad_ifc_flags takes the MLX4_MAD_IFC_* bits of
 * enum mlx4_ib_mad_ifc_flags -- confirm.
 */
523 int mlx4_MAD_IFC(struct mlx4_ib_dev *dev, int mad_ifc_flags,
524 int port, struct ib_wc *in_wc, struct ib_grh *in_grh,
525 void *in_mad, void *response_mad);
526 int mlx4_ib_process_mad(struct ib_device *ibdev, int mad_flags, u8 port_num,
527 struct ib_wc *in_wc, struct ib_grh *in_grh,
528 struct ib_mad *in_mad, struct ib_mad *out_mad);
529 int mlx4_ib_mad_init(struct mlx4_ib_dev *dev);
530 void mlx4_ib_mad_cleanup(struct mlx4_ib_dev *dev);
/*
 * FMR entry points; only declared in this header.
 * NOTE(review): the mlx4_ib_map_phys_fmr() prototype is cut off in this
 * listing -- its continuation (original line 535) is missing.
 */
532 struct ib_fmr *mlx4_ib_fmr_alloc(struct ib_pd *pd, int mr_access_flags,
533 struct ib_fmr_attr *fmr_attr);
534 int mlx4_ib_map_phys_fmr(struct ib_fmr *ibfmr, u64 *page_list, int npages,
536 int mlx4_ib_unmap_fmr(struct list_head *fmr_list);
537 int mlx4_ib_fmr_dealloc(struct ib_fmr *fmr);
/*
 * Port and P_Key queries that take an extra netw_view argument; results are
 * written through props / pkey.
 * presumably netw_view selects the network (physical) view rather than the
 * caller's virtualised view -- confirm.
 */
538 int __mlx4_ib_query_port(struct ib_device *ibdev, u8 port,
539 struct ib_port_attr *props, int netw_view);
540 int __mlx4_ib_query_pkey(struct ib_device *ibdev, u8 port, u16 index,
541 u16 *pkey, int netw_view);
/*
 * Resolve address-handle attributes for a port; ah_attr is read-only (const)
 * and results come back through the mac and is_mcast out-parameters.
 * presumably mac points to a 6-byte buffer -- confirm.
 */
543 int mlx4_ib_resolve_grh(struct mlx4_ib_dev *dev, const struct ib_ah_attr *ah_attr,
544 u8 *mac, int *is_mcast, u8 port);
/*
 * Report whether an address handle carries a GRH.
 *
 * The port number is read from bits 25:24 of av.ib.port_pd after conversion
 * to CPU byte order.  Ports whose link layer is Ethernet take a separate
 * branch; otherwise the result is 1 when bit 0x80 of av.ib.g_slid is set and
 * 0 when it is clear.
 */
546 static inline int mlx4_ib_ah_grh_present(struct mlx4_ib_ah *ah)
/* ">>" binds tighter than "&", so this evaluates as (port_pd >> 24) & 3. */
548 u8 port = be32_to_cpu(ah->av.ib.port_pd) >> 24 & 3;
/*
 * NOTE(review): the statement controlled by this "if" (original line 551) is
 * missing from this listing; as shown, the return below would wrongly become
 * its body.
 */
550 if (rdma_port_get_link_layer(ah->ibah.device, port) == IB_LINK_LAYER_ETHERNET)
/* "!!" normalises the masked bit to exactly 0 or 1. */
553 return !!(ah->av.ib.g_slid & 0x80);
/*
 * NOTE(review): this prototype is cut off in this listing -- the remaining
 * parameters (original lines 557-558) are missing.
 */
556 int mlx4_ib_add_mc(struct mlx4_ib_dev *mdev, struct mlx4_ib_qp *mqp,
/* Dispatch an event of the given ib_event_type for port_num on dev; only declared in this header. */
559 void mlx4_ib_dispatch_event(struct mlx4_ib_dev *dev, u8 port_num,
560 enum ib_event_type type);
/*
 * Has the work-handler signature (a single work_struct pointer).
 * presumably it is installed with INIT_WORK() on an embedded work_struct -- confirm.
 */
562 void mlx4_ib_tunnels_update_work(struct work_struct *work);
564 #endif /* MLX4_IB_H */