1 /* QLogic qedr NIC Driver
2 * Copyright (c) 2015-2016 QLogic Corporation
4 * This software is available to you under a choice of one of two
5 * licenses. You may choose to be licensed under the terms of the GNU
6 * General Public License (GPL) Version 2, available from the file
7 * COPYING in the main directory of this source tree, or the
8 * OpenIB.org BSD license below:
10 * Redistribution and use in source and binary forms, with or
11 * without modification, are permitted provided that the following
14 * - Redistributions of source code must retain the above
15 * copyright notice, this list of conditions and the following
18 * - Redistributions in binary form must reproduce the above
19 * copyright notice, this list of conditions and the following
20 * disclaimer in the documentation and /or other materials
21 * provided with the distribution.
23 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
24 * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
25 * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
26 * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS
27 * BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN
28 * ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN
29 * CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
32 #include <linux/module.h>
33 #include <rdma/ib_verbs.h>
34 #include <rdma/ib_addr.h>
35 #include <rdma/ib_user_verbs.h>
36 #include <linux/netdevice.h>
37 #include <linux/iommu.h>
38 #include <net/addrconf.h>
39 #include <linux/qed/qede_roce.h>
40 #include <linux/qed/qed_chain.h>
41 #include <linux/qed/qed_if.h>
44 #include <rdma/qedr-abi.h>
46 MODULE_DESCRIPTION("QLogic 40G/100G ROCE Driver");
47 MODULE_AUTHOR("QLogic Corporation");
48 MODULE_LICENSE("Dual BSD/GPL");
49 MODULE_VERSION(QEDR_MODULE_VERSION);
51 #define QEDR_WQ_MULTIPLIER_DFT (3)
53 void qedr_ib_dispatch_event(struct qedr_dev *dev, u8 port_num,
54 enum ib_event_type type)
58 ibev.device = &dev->ibdev;
59 ibev.element.port_num = port_num;
62 ib_dispatch_event(&ibev);
65 static enum rdma_link_layer qedr_link_layer(struct ib_device *device,
68 return IB_LINK_LAYER_ETHERNET;
71 static void qedr_get_dev_fw_str(struct ib_device *ibdev, char *str,
74 struct qedr_dev *qedr = get_qedr_dev(ibdev);
75 u32 fw_ver = (u32)qedr->attr.fw_ver;
77 snprintf(str, str_len, "%d. %d. %d. %d",
78 (fw_ver >> 24) & 0xFF, (fw_ver >> 16) & 0xFF,
79 (fw_ver >> 8) & 0xFF, fw_ver & 0xFF);
82 static int qedr_register_device(struct qedr_dev *dev)
84 strlcpy(dev->ibdev.name, "qedr%d", IB_DEVICE_NAME_MAX);
86 memcpy(dev->ibdev.node_desc, QEDR_NODE_DESC, sizeof(QEDR_NODE_DESC));
87 dev->ibdev.owner = THIS_MODULE;
88 dev->ibdev.uverbs_abi_ver = QEDR_ABI_VERSION;
90 dev->ibdev.uverbs_cmd_mask = QEDR_UVERBS(GET_CONTEXT) |
91 QEDR_UVERBS(QUERY_DEVICE) |
92 QEDR_UVERBS(QUERY_PORT) |
93 QEDR_UVERBS(ALLOC_PD) |
94 QEDR_UVERBS(DEALLOC_PD) |
95 QEDR_UVERBS(CREATE_COMP_CHANNEL) |
96 QEDR_UVERBS(CREATE_CQ) |
97 QEDR_UVERBS(RESIZE_CQ) |
98 QEDR_UVERBS(DESTROY_CQ) |
99 QEDR_UVERBS(REQ_NOTIFY_CQ) |
100 QEDR_UVERBS(CREATE_QP) |
101 QEDR_UVERBS(MODIFY_QP) |
102 QEDR_UVERBS(QUERY_QP) |
103 QEDR_UVERBS(DESTROY_QP);
105 dev->ibdev.phys_port_cnt = 1;
106 dev->ibdev.num_comp_vectors = dev->num_cnq;
107 dev->ibdev.node_type = RDMA_NODE_IB_CA;
109 dev->ibdev.query_device = qedr_query_device;
110 dev->ibdev.query_port = qedr_query_port;
111 dev->ibdev.modify_port = qedr_modify_port;
113 dev->ibdev.query_gid = qedr_query_gid;
114 dev->ibdev.add_gid = qedr_add_gid;
115 dev->ibdev.del_gid = qedr_del_gid;
117 dev->ibdev.alloc_ucontext = qedr_alloc_ucontext;
118 dev->ibdev.dealloc_ucontext = qedr_dealloc_ucontext;
119 dev->ibdev.mmap = qedr_mmap;
121 dev->ibdev.alloc_pd = qedr_alloc_pd;
122 dev->ibdev.dealloc_pd = qedr_dealloc_pd;
124 dev->ibdev.create_cq = qedr_create_cq;
125 dev->ibdev.destroy_cq = qedr_destroy_cq;
126 dev->ibdev.resize_cq = qedr_resize_cq;
127 dev->ibdev.req_notify_cq = qedr_arm_cq;
129 dev->ibdev.create_qp = qedr_create_qp;
130 dev->ibdev.modify_qp = qedr_modify_qp;
131 dev->ibdev.query_qp = qedr_query_qp;
132 dev->ibdev.destroy_qp = qedr_destroy_qp;
134 dev->ibdev.query_pkey = qedr_query_pkey;
136 dev->ibdev.dma_device = &dev->pdev->dev;
138 dev->ibdev.get_link_layer = qedr_link_layer;
139 dev->ibdev.get_dev_fw_str = qedr_get_dev_fw_str;
144 /* This function allocates fast-path status block memory */
145 static int qedr_alloc_mem_sb(struct qedr_dev *dev,
146 struct qed_sb_info *sb_info, u16 sb_id)
148 struct status_block *sb_virt;
152 sb_virt = dma_alloc_coherent(&dev->pdev->dev,
153 sizeof(*sb_virt), &sb_phys, GFP_KERNEL);
157 rc = dev->ops->common->sb_init(dev->cdev, sb_info,
158 sb_virt, sb_phys, sb_id,
161 pr_err("Status block initialization failed\n");
162 dma_free_coherent(&dev->pdev->dev, sizeof(*sb_virt),
170 static void qedr_free_mem_sb(struct qedr_dev *dev,
171 struct qed_sb_info *sb_info, int sb_id)
173 if (sb_info->sb_virt) {
174 dev->ops->common->sb_release(dev->cdev, sb_info, sb_id);
175 dma_free_coherent(&dev->pdev->dev, sizeof(*sb_info->sb_virt),
176 (void *)sb_info->sb_virt, sb_info->sb_phys);
180 static void qedr_free_resources(struct qedr_dev *dev)
184 for (i = 0; i < dev->num_cnq; i++) {
185 qedr_free_mem_sb(dev, &dev->sb_array[i], dev->sb_start + i);
186 dev->ops->common->chain_free(dev->cdev, &dev->cnq_array[i].pbl);
189 kfree(dev->cnq_array);
190 kfree(dev->sb_array);
191 kfree(dev->sgid_tbl);
194 static int qedr_alloc_resources(struct qedr_dev *dev)
196 struct qedr_cnq *cnq;
201 dev->sgid_tbl = kzalloc(sizeof(union ib_gid) *
202 QEDR_MAX_SGID, GFP_KERNEL);
206 spin_lock_init(&dev->sgid_lock);
208 /* Allocate Status blocks for CNQ */
209 dev->sb_array = kcalloc(dev->num_cnq, sizeof(*dev->sb_array),
211 if (!dev->sb_array) {
216 dev->cnq_array = kcalloc(dev->num_cnq,
217 sizeof(*dev->cnq_array), GFP_KERNEL);
218 if (!dev->cnq_array) {
223 dev->sb_start = dev->ops->rdma_get_start_sb(dev->cdev);
225 /* Allocate CNQ PBLs */
226 n_entries = min_t(u32, QED_RDMA_MAX_CNQ_SIZE, QEDR_ROCE_MAX_CNQ_SIZE);
227 for (i = 0; i < dev->num_cnq; i++) {
228 cnq = &dev->cnq_array[i];
230 rc = qedr_alloc_mem_sb(dev, &dev->sb_array[i],
235 rc = dev->ops->common->chain_alloc(dev->cdev,
236 QED_CHAIN_USE_TO_CONSUME,
238 QED_CHAIN_CNT_TYPE_U16,
240 sizeof(struct regpair *),
246 cnq->sb = &dev->sb_array[i];
247 cons_pi = dev->sb_array[i].sb_virt->pi_array;
248 cnq->hw_cons_ptr = &cons_pi[QED_ROCE_PROTOCOL_INDEX];
250 sprintf(cnq->name, "qedr%d@pci:%s", i, pci_name(dev->pdev));
252 DP_DEBUG(dev, QEDR_MSG_INIT, "cnq[%d].cons=%d\n",
253 i, qed_chain_get_cons_idx(&cnq->pbl));
258 qedr_free_mem_sb(dev, &dev->sb_array[i], dev->sb_start + i);
260 for (--i; i >= 0; i--) {
261 dev->ops->common->chain_free(dev->cdev, &dev->cnq_array[i].pbl);
262 qedr_free_mem_sb(dev, &dev->sb_array[i], dev->sb_start + i);
264 kfree(dev->cnq_array);
266 kfree(dev->sb_array);
268 kfree(dev->sgid_tbl);
272 /* QEDR sysfs interface */
273 static ssize_t show_rev(struct device *device, struct device_attribute *attr,
276 struct qedr_dev *dev = dev_get_drvdata(device);
278 return scnprintf(buf, PAGE_SIZE, "0x%x\n", dev->pdev->vendor);
281 static ssize_t show_hca_type(struct device *device,
282 struct device_attribute *attr, char *buf)
284 return scnprintf(buf, PAGE_SIZE, "%s\n", "HCA_TYPE_TO_SET");
287 static DEVICE_ATTR(hw_rev, S_IRUGO, show_rev, NULL);
288 static DEVICE_ATTR(hca_type, S_IRUGO, show_hca_type, NULL);
290 static struct device_attribute *qedr_attributes[] = {
295 static void qedr_remove_sysfiles(struct qedr_dev *dev)
299 for (i = 0; i < ARRAY_SIZE(qedr_attributes); i++)
300 device_remove_file(&dev->ibdev.dev, qedr_attributes[i]);
303 static void qedr_pci_set_atomic(struct qedr_dev *dev, struct pci_dev *pdev)
305 struct pci_dev *bridge;
308 dev->atomic_cap = IB_ATOMIC_NONE;
310 bridge = pdev->bus->self;
314 /* Check whether we are connected directly or via a switch */
315 while (bridge && bridge->bus->parent) {
316 DP_DEBUG(dev, QEDR_MSG_INIT,
317 "Device is not connected directly to root. bridge->bus->number=%d primary=%d\n",
318 bridge->bus->number, bridge->bus->primary);
319 /* Need to check Atomic Op Routing Supported all the way to
322 pcie_capability_read_dword(bridge, PCI_EXP_DEVCAP2, &val);
323 if (!(val & PCI_EXP_DEVCAP2_ATOMIC_ROUTE)) {
324 pcie_capability_clear_word(pdev,
326 PCI_EXP_DEVCTL2_ATOMIC_REQ);
329 bridge = bridge->bus->parent->self;
331 bridge = pdev->bus->self;
333 /* according to bridge capability */
334 pcie_capability_read_dword(bridge, PCI_EXP_DEVCAP2, &val);
335 if (val & PCI_EXP_DEVCAP2_ATOMIC_COMP64) {
336 pcie_capability_set_word(pdev, PCI_EXP_DEVCTL2,
337 PCI_EXP_DEVCTL2_ATOMIC_REQ);
338 dev->atomic_cap = IB_ATOMIC_GLOB;
340 pcie_capability_clear_word(pdev, PCI_EXP_DEVCTL2,
341 PCI_EXP_DEVCTL2_ATOMIC_REQ);
345 static const struct qed_rdma_ops *qed_ops;
347 #define HILO_U64(hi, lo) ((((u64)(hi)) << 32) + (lo))
349 static irqreturn_t qedr_irq_handler(int irq, void *handle)
351 u16 hw_comp_cons, sw_comp_cons;
352 struct qedr_cnq *cnq = handle;
353 struct regpair *cq_handle;
356 qed_sb_ack(cnq->sb, IGU_INT_DISABLE, 0);
358 qed_sb_update_sb_idx(cnq->sb);
360 hw_comp_cons = le16_to_cpu(*cnq->hw_cons_ptr);
361 sw_comp_cons = qed_chain_get_cons_idx(&cnq->pbl);
363 /* Align protocol-index and chain reads */
366 while (sw_comp_cons != hw_comp_cons) {
367 cq_handle = (struct regpair *)qed_chain_consume(&cnq->pbl);
368 cq = (struct qedr_cq *)(uintptr_t)HILO_U64(cq_handle->hi,
373 "Received NULL CQ cq_handle->hi=%d cq_handle->lo=%d sw_comp_cons=%d hw_comp_cons=%d\n",
374 cq_handle->hi, cq_handle->lo, sw_comp_cons,
380 if (cq->sig != QEDR_CQ_MAGIC_NUMBER) {
382 "Problem with cq signature, cq_handle->hi=%d ch_handle->lo=%d cq=%p\n",
383 cq_handle->hi, cq_handle->lo, cq);
389 if (cq->ibcq.comp_handler)
390 (*cq->ibcq.comp_handler)
391 (&cq->ibcq, cq->ibcq.cq_context);
393 sw_comp_cons = qed_chain_get_cons_idx(&cnq->pbl);
399 qed_ops->rdma_cnq_prod_update(cnq->dev->rdma_ctx, cnq->index,
402 qed_sb_ack(cnq->sb, IGU_INT_ENABLE, 1);
407 static void qedr_sync_free_irqs(struct qedr_dev *dev)
412 for (i = 0; i < dev->int_info.used_cnt; i++) {
413 if (dev->int_info.msix_cnt) {
414 vector = dev->int_info.msix[i * dev->num_hwfns].vector;
415 synchronize_irq(vector);
416 free_irq(vector, &dev->cnq_array[i]);
420 dev->int_info.used_cnt = 0;
423 static int qedr_req_msix_irqs(struct qedr_dev *dev)
427 if (dev->num_cnq > dev->int_info.msix_cnt) {
429 "Interrupt mismatch: %d CNQ queues > %d MSI-x vectors\n",
430 dev->num_cnq, dev->int_info.msix_cnt);
434 for (i = 0; i < dev->num_cnq; i++) {
435 rc = request_irq(dev->int_info.msix[i * dev->num_hwfns].vector,
436 qedr_irq_handler, 0, dev->cnq_array[i].name,
439 DP_ERR(dev, "Request cnq %d irq failed\n", i);
440 qedr_sync_free_irqs(dev);
442 DP_DEBUG(dev, QEDR_MSG_INIT,
443 "Requested cnq irq for %s [entry %d]. Cookie is at %p\n",
444 dev->cnq_array[i].name, i,
446 dev->int_info.used_cnt++;
453 static int qedr_setup_irqs(struct qedr_dev *dev)
457 DP_DEBUG(dev, QEDR_MSG_INIT, "qedr_setup_irqs\n");
459 /* Learn Interrupt configuration */
460 rc = dev->ops->rdma_set_rdma_int(dev->cdev, dev->num_cnq);
464 rc = dev->ops->rdma_get_rdma_int(dev->cdev, &dev->int_info);
466 DP_DEBUG(dev, QEDR_MSG_INIT, "get_rdma_int failed\n");
470 if (dev->int_info.msix_cnt) {
471 DP_DEBUG(dev, QEDR_MSG_INIT, "rdma msix_cnt = %d\n",
472 dev->int_info.msix_cnt);
473 rc = qedr_req_msix_irqs(dev);
478 DP_DEBUG(dev, QEDR_MSG_INIT, "qedr_setup_irqs succeeded\n");
483 static int qedr_set_device_attr(struct qedr_dev *dev)
485 struct qed_rdma_device *qed_attr;
486 struct qedr_device_attr *attr;
489 /* Part 1 - query core capabilities */
490 qed_attr = dev->ops->rdma_query_device(dev->rdma_ctx);
492 /* Part 2 - check capabilities */
493 page_size = ~dev->attr.page_size_caps + 1;
494 if (page_size > PAGE_SIZE) {
496 "Kernel PAGE_SIZE is %ld which is smaller than minimum page size (%d) required by qedr\n",
497 PAGE_SIZE, page_size);
501 /* Part 3 - copy and update capabilities */
503 attr->vendor_id = qed_attr->vendor_id;
504 attr->vendor_part_id = qed_attr->vendor_part_id;
505 attr->hw_ver = qed_attr->hw_ver;
506 attr->fw_ver = qed_attr->fw_ver;
507 attr->node_guid = qed_attr->node_guid;
508 attr->sys_image_guid = qed_attr->sys_image_guid;
509 attr->max_cnq = qed_attr->max_cnq;
510 attr->max_sge = qed_attr->max_sge;
511 attr->max_inline = qed_attr->max_inline;
512 attr->max_sqe = min_t(u32, qed_attr->max_wqe, QEDR_MAX_SQE);
513 attr->max_rqe = min_t(u32, qed_attr->max_wqe, QEDR_MAX_RQE);
514 attr->max_qp_resp_rd_atomic_resc = qed_attr->max_qp_resp_rd_atomic_resc;
515 attr->max_qp_req_rd_atomic_resc = qed_attr->max_qp_req_rd_atomic_resc;
516 attr->max_dev_resp_rd_atomic_resc =
517 qed_attr->max_dev_resp_rd_atomic_resc;
518 attr->max_cq = qed_attr->max_cq;
519 attr->max_qp = qed_attr->max_qp;
520 attr->max_mr = qed_attr->max_mr;
521 attr->max_mr_size = qed_attr->max_mr_size;
522 attr->max_cqe = min_t(u64, qed_attr->max_cqe, QEDR_MAX_CQES);
523 attr->max_mw = qed_attr->max_mw;
524 attr->max_fmr = qed_attr->max_fmr;
525 attr->max_mr_mw_fmr_pbl = qed_attr->max_mr_mw_fmr_pbl;
526 attr->max_mr_mw_fmr_size = qed_attr->max_mr_mw_fmr_size;
527 attr->max_pd = qed_attr->max_pd;
528 attr->max_ah = qed_attr->max_ah;
529 attr->max_pkey = qed_attr->max_pkey;
530 attr->max_srq = qed_attr->max_srq;
531 attr->max_srq_wr = qed_attr->max_srq_wr;
532 attr->dev_caps = qed_attr->dev_caps;
533 attr->page_size_caps = qed_attr->page_size_caps;
534 attr->dev_ack_delay = qed_attr->dev_ack_delay;
535 attr->reserved_lkey = qed_attr->reserved_lkey;
536 attr->bad_pkey_counter = qed_attr->bad_pkey_counter;
537 attr->max_stats_queues = qed_attr->max_stats_queues;
542 static int qedr_init_hw(struct qedr_dev *dev)
544 struct qed_rdma_add_user_out_params out_params;
545 struct qed_rdma_start_in_params *in_params;
546 struct qed_rdma_cnq_params *cur_pbl;
547 struct qed_rdma_events events;
548 dma_addr_t p_phys_table;
553 in_params = kzalloc(sizeof(*in_params), GFP_KERNEL);
559 in_params->desired_cnq = dev->num_cnq;
560 for (i = 0; i < dev->num_cnq; i++) {
561 cur_pbl = &in_params->cnq_pbl_list[i];
563 page_cnt = qed_chain_get_page_cnt(&dev->cnq_array[i].pbl);
564 cur_pbl->num_pbl_pages = page_cnt;
566 p_phys_table = qed_chain_get_pbl_phys(&dev->cnq_array[i].pbl);
567 cur_pbl->pbl_ptr = (u64)p_phys_table;
570 events.context = dev;
572 in_params->events = &events;
573 in_params->cq_mode = QED_RDMA_CQ_MODE_32_BITS;
574 in_params->max_mtu = dev->ndev->mtu;
575 ether_addr_copy(&in_params->mac_addr[0], dev->ndev->dev_addr);
577 rc = dev->ops->rdma_init(dev->cdev, in_params);
581 rc = dev->ops->rdma_add_user(dev->rdma_ctx, &out_params);
585 dev->db_addr = (void *)(uintptr_t)out_params.dpi_addr;
586 dev->db_phys_addr = out_params.dpi_phys_addr;
587 dev->db_size = out_params.dpi_size;
588 dev->dpi = out_params.dpi;
590 rc = qedr_set_device_attr(dev);
594 DP_ERR(dev, "Init HW Failed rc = %d\n", rc);
599 void qedr_stop_hw(struct qedr_dev *dev)
601 dev->ops->rdma_remove_user(dev->rdma_ctx, dev->dpi);
602 dev->ops->rdma_stop(dev->rdma_ctx);
605 static struct qedr_dev *qedr_add(struct qed_dev *cdev, struct pci_dev *pdev,
606 struct net_device *ndev)
608 struct qed_dev_rdma_info dev_info;
609 struct qedr_dev *dev;
612 dev = (struct qedr_dev *)ib_alloc_device(sizeof(*dev));
614 pr_err("Unable to allocate ib device\n");
618 DP_DEBUG(dev, QEDR_MSG_INIT, "qedr add device called\n");
624 qed_ops = qed_get_rdma_ops();
626 DP_ERR(dev, "Failed to get qed roce operations\n");
631 rc = qed_ops->fill_dev_info(cdev, &dev_info);
635 dev->num_hwfns = dev_info.common.num_hwfns;
636 dev->rdma_ctx = dev->ops->rdma_get_rdma_ctx(cdev);
638 dev->num_cnq = dev->ops->rdma_get_min_cnq_msix(cdev);
640 DP_ERR(dev, "not enough CNQ resources.\n");
644 dev->wq_multiplier = QEDR_WQ_MULTIPLIER_DFT;
646 qedr_pci_set_atomic(dev, pdev);
648 rc = qedr_alloc_resources(dev);
652 rc = qedr_init_hw(dev);
656 rc = qedr_setup_irqs(dev);
660 rc = qedr_register_device(dev);
662 DP_ERR(dev, "Unable to allocate register device\n");
666 for (i = 0; i < ARRAY_SIZE(qedr_attributes); i++)
667 if (device_create_file(&dev->ibdev.dev, qedr_attributes[i]))
670 DP_DEBUG(dev, QEDR_MSG_INIT, "qedr driver loaded successfully\n");
674 qedr_sync_free_irqs(dev);
678 qedr_free_resources(dev);
680 ib_dealloc_device(&dev->ibdev);
681 DP_ERR(dev, "qedr driver load failed rc=%d\n", rc);
686 static void qedr_remove(struct qedr_dev *dev)
688 /* First unregister with stack to stop all the active traffic
689 * of the registered clients.
691 qedr_remove_sysfiles(dev);
694 qedr_sync_free_irqs(dev);
695 qedr_free_resources(dev);
696 ib_dealloc_device(&dev->ibdev);
699 static int qedr_close(struct qedr_dev *dev)
701 qedr_ib_dispatch_event(dev, 1, IB_EVENT_PORT_ERR);
706 static void qedr_shutdown(struct qedr_dev *dev)
712 /* event handling via NIC driver ensures that all the NIC specific
713 * initialization done before RoCE driver notifies
716 static void qedr_notify(struct qedr_dev *dev, enum qede_roce_event event)
720 qedr_ib_dispatch_event(dev, 1, IB_EVENT_PORT_ACTIVE);
728 case QEDE_CHANGE_ADDR:
729 qedr_ib_dispatch_event(dev, 1, IB_EVENT_GID_CHANGE);
732 pr_err("Event not supported\n");
736 static struct qedr_driver qedr_drv = {
737 .name = "qedr_driver",
739 .remove = qedr_remove,
740 .notify = qedr_notify,
743 static int __init qedr_init_module(void)
745 return qede_roce_register_driver(&qedr_drv);
748 static void __exit qedr_exit_module(void)
750 qede_roce_unregister_driver(&qedr_drv);
753 module_init(qedr_init_module);
754 module_exit(qedr_exit_module);