/* This file is part of the Emulex RoCE Device Driver for
 * RoCE (RDMA over Converged Ethernet) adapters.
 * Copyright (C) 2012-2015 Emulex. All rights reserved.
 * EMULEX and SLI are trademarks of Emulex.
 *
 * This software is available to you under a choice of one of two licenses.
 * You may choose to be licensed under the terms of the GNU General Public
 * License (GPL) Version 2, available from the file COPYING in the main
 * directory of this source tree, or the BSD license below:
 *
 * Redistribution and use in source and binary forms, with or without
 * modification, are permitted provided that the following conditions
 * are met:
 *
 * - Redistributions of source code must retain the above copyright notice,
 *   this list of conditions and the following disclaimer.
 *
 * - Redistributions in binary form must reproduce the above copyright
 *   notice, this list of conditions and the following disclaimer in
 *   the documentation and/or other materials provided with the distribution.
 *
 * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
 * AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO,THE
 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
 * ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT HOLDER OR CONTRIBUTORS BE
 * LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
 * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
 * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
 * BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
 * WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR
 * OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF
 * ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 *
 * Contact Information:
 * linux-drivers@emulex.com
 *
 * Costa Mesa, CA 92626
 */
43 #include <linux/module.h>
44 #include <linux/idr.h>
45 #include <rdma/ib_verbs.h>
46 #include <rdma/ib_user_verbs.h>
47 #include <rdma/ib_addr.h>
48 #include <rdma/ib_mad.h>
50 #include <linux/netdevice.h>
51 #include <net/addrconf.h>
54 #include "ocrdma_verbs.h"
55 #include "ocrdma_ah.h"
57 #include "ocrdma_hw.h"
58 #include "ocrdma_stats.h"
59 #include <rdma/ocrdma-abi.h>
61 MODULE_DESCRIPTION(OCRDMA_ROCE_DRV_DESC
" " OCRDMA_ROCE_DRV_VERSION
);
62 MODULE_AUTHOR("Emulex Corporation");
63 MODULE_LICENSE("Dual BSD/GPL");
65 static enum rdma_link_layer
ocrdma_link_layer(struct ib_device
*device
,
68 return IB_LINK_LAYER_ETHERNET
;
71 static int ocrdma_port_immutable(struct ib_device
*ibdev
, u32 port_num
,
72 struct ib_port_immutable
*immutable
)
74 struct ib_port_attr attr
;
75 struct ocrdma_dev
*dev
;
78 dev
= get_ocrdma_dev(ibdev
);
79 immutable
->core_cap_flags
= RDMA_CORE_PORT_IBA_ROCE
;
80 if (ocrdma_is_udp_encap_supported(dev
))
81 immutable
->core_cap_flags
|= RDMA_CORE_CAP_PROT_ROCE_UDP_ENCAP
;
83 err
= ib_query_port(ibdev
, port_num
, &attr
);
87 immutable
->pkey_tbl_len
= attr
.pkey_tbl_len
;
88 immutable
->gid_tbl_len
= attr
.gid_tbl_len
;
89 immutable
->max_mad_size
= IB_MGMT_MAD_SIZE
;
94 static void get_dev_fw_str(struct ib_device
*device
, char *str
)
96 struct ocrdma_dev
*dev
= get_ocrdma_dev(device
);
98 snprintf(str
, IB_FW_VERSION_NAME_MAX
, "%s", &dev
->attr
.fw_ver
[0]);
101 /* OCRDMA sysfs interface */
102 static ssize_t
hw_rev_show(struct device
*device
,
103 struct device_attribute
*attr
, char *buf
)
105 struct ocrdma_dev
*dev
=
106 rdma_device_to_drv_device(device
, struct ocrdma_dev
, ibdev
);
108 return sysfs_emit(buf
, "0x%x\n", dev
->nic_info
.pdev
->vendor
);
110 static DEVICE_ATTR_RO(hw_rev
);
112 static ssize_t
hca_type_show(struct device
*device
,
113 struct device_attribute
*attr
, char *buf
)
115 struct ocrdma_dev
*dev
=
116 rdma_device_to_drv_device(device
, struct ocrdma_dev
, ibdev
);
118 return sysfs_emit(buf
, "%s\n", &dev
->model_number
[0]);
120 static DEVICE_ATTR_RO(hca_type
);
122 static struct attribute
*ocrdma_attributes
[] = {
123 &dev_attr_hw_rev
.attr
,
124 &dev_attr_hca_type
.attr
,
128 static const struct attribute_group ocrdma_attr_group
= {
129 .attrs
= ocrdma_attributes
,
132 static const struct ib_device_ops ocrdma_dev_ops
= {
133 .owner
= THIS_MODULE
,
134 .driver_id
= RDMA_DRIVER_OCRDMA
,
135 .uverbs_abi_ver
= OCRDMA_ABI_VERSION
,
137 .alloc_mr
= ocrdma_alloc_mr
,
138 .alloc_pd
= ocrdma_alloc_pd
,
139 .alloc_ucontext
= ocrdma_alloc_ucontext
,
140 .create_ah
= ocrdma_create_ah
,
141 .create_cq
= ocrdma_create_cq
,
142 .create_qp
= ocrdma_create_qp
,
143 .create_user_ah
= ocrdma_create_ah
,
144 .dealloc_pd
= ocrdma_dealloc_pd
,
145 .dealloc_ucontext
= ocrdma_dealloc_ucontext
,
146 .dereg_mr
= ocrdma_dereg_mr
,
147 .destroy_ah
= ocrdma_destroy_ah
,
148 .destroy_cq
= ocrdma_destroy_cq
,
149 .destroy_qp
= ocrdma_destroy_qp
,
150 .device_group
= &ocrdma_attr_group
,
151 .get_dev_fw_str
= get_dev_fw_str
,
152 .get_dma_mr
= ocrdma_get_dma_mr
,
153 .get_link_layer
= ocrdma_link_layer
,
154 .get_port_immutable
= ocrdma_port_immutable
,
155 .map_mr_sg
= ocrdma_map_mr_sg
,
157 .modify_qp
= ocrdma_modify_qp
,
158 .poll_cq
= ocrdma_poll_cq
,
159 .post_recv
= ocrdma_post_recv
,
160 .post_send
= ocrdma_post_send
,
161 .process_mad
= ocrdma_process_mad
,
162 .query_ah
= ocrdma_query_ah
,
163 .query_device
= ocrdma_query_device
,
164 .query_pkey
= ocrdma_query_pkey
,
165 .query_port
= ocrdma_query_port
,
166 .query_qp
= ocrdma_query_qp
,
167 .reg_user_mr
= ocrdma_reg_user_mr
,
168 .req_notify_cq
= ocrdma_arm_cq
,
169 .resize_cq
= ocrdma_resize_cq
,
171 INIT_RDMA_OBJ_SIZE(ib_ah
, ocrdma_ah
, ibah
),
172 INIT_RDMA_OBJ_SIZE(ib_cq
, ocrdma_cq
, ibcq
),
173 INIT_RDMA_OBJ_SIZE(ib_pd
, ocrdma_pd
, ibpd
),
174 INIT_RDMA_OBJ_SIZE(ib_qp
, ocrdma_qp
, ibqp
),
175 INIT_RDMA_OBJ_SIZE(ib_ucontext
, ocrdma_ucontext
, ibucontext
),
178 static const struct ib_device_ops ocrdma_dev_srq_ops
= {
179 .create_srq
= ocrdma_create_srq
,
180 .destroy_srq
= ocrdma_destroy_srq
,
181 .modify_srq
= ocrdma_modify_srq
,
182 .post_srq_recv
= ocrdma_post_srq_recv
,
183 .query_srq
= ocrdma_query_srq
,
185 INIT_RDMA_OBJ_SIZE(ib_srq
, ocrdma_srq
, ibsrq
),
188 static int ocrdma_register_device(struct ocrdma_dev
*dev
)
192 addrconf_addr_eui48((u8
*)&dev
->ibdev
.node_guid
,
193 dev
->nic_info
.mac_addr
);
194 BUILD_BUG_ON(sizeof(OCRDMA_NODE_DESC
) > IB_DEVICE_NODE_DESC_MAX
);
195 memcpy(dev
->ibdev
.node_desc
, OCRDMA_NODE_DESC
,
196 sizeof(OCRDMA_NODE_DESC
));
198 dev
->ibdev
.node_type
= RDMA_NODE_IB_CA
;
199 dev
->ibdev
.phys_port_cnt
= 1;
200 dev
->ibdev
.num_comp_vectors
= dev
->eq_cnt
;
202 /* mandatory to support user space verbs consumer. */
203 dev
->ibdev
.dev
.parent
= &dev
->nic_info
.pdev
->dev
;
205 ib_set_device_ops(&dev
->ibdev
, &ocrdma_dev_ops
);
207 if (ocrdma_get_asic_type(dev
) == OCRDMA_ASIC_GEN_SKH_R
)
208 ib_set_device_ops(&dev
->ibdev
, &ocrdma_dev_srq_ops
);
210 ret
= ib_device_set_netdev(&dev
->ibdev
, dev
->nic_info
.netdev
, 1);
214 dma_set_max_seg_size(&dev
->nic_info
.pdev
->dev
, UINT_MAX
);
215 return ib_register_device(&dev
->ibdev
, "ocrdma%d",
216 &dev
->nic_info
.pdev
->dev
);
219 static int ocrdma_alloc_resources(struct ocrdma_dev
*dev
)
221 mutex_init(&dev
->dev_lock
);
222 dev
->cq_tbl
= kcalloc(OCRDMA_MAX_CQ
, sizeof(struct ocrdma_cq
*),
227 if (dev
->attr
.max_qp
) {
228 dev
->qp_tbl
= kcalloc(OCRDMA_MAX_QP
,
229 sizeof(struct ocrdma_qp
*),
235 dev
->stag_arr
= kcalloc(OCRDMA_MAX_STAG
, sizeof(u64
), GFP_KERNEL
);
236 if (dev
->stag_arr
== NULL
)
239 ocrdma_alloc_pd_pool(dev
);
241 if (!ocrdma_alloc_stats_resources(dev
)) {
242 pr_err("%s: stats resource allocation failed\n", __func__
);
246 spin_lock_init(&dev
->av_tbl
.lock
);
247 spin_lock_init(&dev
->flush_q_lock
);
250 pr_err("%s(%d) error.\n", __func__
, dev
->id
);
254 static void ocrdma_free_resources(struct ocrdma_dev
*dev
)
256 ocrdma_release_stats_resources(dev
);
257 kfree(dev
->stag_arr
);
262 static struct ocrdma_dev
*ocrdma_add(struct be_dev_info
*dev_info
)
266 struct ocrdma_dev
*dev
;
268 dev
= ib_alloc_device(ocrdma_dev
, ibdev
);
270 pr_err("Unable to allocate ib device\n");
274 dev
->mbx_cmd
= kzalloc(sizeof(struct ocrdma_mqe_emb_cmd
), GFP_KERNEL
);
278 memcpy(&dev
->nic_info
, dev_info
, sizeof(*dev_info
));
279 dev
->id
= PCI_FUNC(dev
->nic_info
.pdev
->devfn
);
280 status
= ocrdma_init_hw(dev
);
284 status
= ocrdma_alloc_resources(dev
);
288 ocrdma_init_service_level(dev
);
289 status
= ocrdma_register_device(dev
);
293 /* Query Link state and update */
294 status
= ocrdma_mbx_get_link_speed(dev
, NULL
, &lstate
);
296 ocrdma_update_link_state(dev
, lstate
);
299 ocrdma_add_port_stats(dev
);
300 /* Interrupt Moderation */
301 INIT_DELAYED_WORK(&dev
->eqd_work
, ocrdma_eqd_set_task
);
302 schedule_delayed_work(&dev
->eqd_work
, msecs_to_jiffies(1000));
304 pr_info("%s %s: %s \"%s\" port %d\n",
305 dev_name(&dev
->nic_info
.pdev
->dev
), hca_name(dev
),
306 port_speed_string(dev
), dev
->model_number
,
308 pr_info("%s ocrdma%d driver loaded successfully\n",
309 dev_name(&dev
->nic_info
.pdev
->dev
), dev
->id
);
313 ocrdma_free_resources(dev
);
314 ocrdma_cleanup_hw(dev
);
317 ib_dealloc_device(&dev
->ibdev
);
318 pr_err("%s() leaving. ret=%d\n", __func__
, status
);
322 static void ocrdma_remove_free(struct ocrdma_dev
*dev
)
326 ib_dealloc_device(&dev
->ibdev
);
329 static void ocrdma_remove(struct ocrdma_dev
*dev
)
331 /* first unregister with stack to stop all the active traffic
332 * of the registered clients.
334 cancel_delayed_work_sync(&dev
->eqd_work
);
335 ib_unregister_device(&dev
->ibdev
);
337 ocrdma_rem_port_stats(dev
);
338 ocrdma_free_resources(dev
);
339 ocrdma_cleanup_hw(dev
);
340 ocrdma_remove_free(dev
);
343 static int ocrdma_dispatch_port_active(struct ocrdma_dev
*dev
)
345 struct ib_event port_event
;
347 port_event
.event
= IB_EVENT_PORT_ACTIVE
;
348 port_event
.element
.port_num
= 1;
349 port_event
.device
= &dev
->ibdev
;
350 ib_dispatch_event(&port_event
);
354 static int ocrdma_dispatch_port_error(struct ocrdma_dev
*dev
)
356 struct ib_event err_event
;
358 err_event
.event
= IB_EVENT_PORT_ERR
;
359 err_event
.element
.port_num
= 1;
360 err_event
.device
= &dev
->ibdev
;
361 ib_dispatch_event(&err_event
);
/*
 * Handle a shutdown notification: report a port error to consumers and
 * then tear the device down.
 */
static void ocrdma_shutdown(struct ocrdma_dev *dev)
{
	ocrdma_dispatch_port_error(dev);
	/*
	 * NOTE(review): exactly one statement after the dispatch was lost
	 * in the damaged source; it is restored as the device teardown --
	 * confirm against the upstream driver.
	 */
	ocrdma_remove(dev);
}
371 /* event handling via NIC driver ensures that all the NIC specific
372 * initialization done before RoCE driver notifies
375 static void ocrdma_event_handler(struct ocrdma_dev
*dev
, u32 event
)
378 case BE_DEV_SHUTDOWN
:
379 ocrdma_shutdown(dev
);
386 void ocrdma_update_link_state(struct ocrdma_dev
*dev
, u8 lstate
)
388 if (!(dev
->flags
& OCRDMA_FLAGS_LINK_STATUS_INIT
)) {
389 dev
->flags
|= OCRDMA_FLAGS_LINK_STATUS_INIT
;
395 ocrdma_dispatch_port_error(dev
);
397 ocrdma_dispatch_port_active(dev
);
400 static struct ocrdma_driver ocrdma_drv
= {
401 .name
= "ocrdma_driver",
403 .remove
= ocrdma_remove
,
404 .state_change_handler
= ocrdma_event_handler
,
405 .be_abi_version
= OCRDMA_BE_ROCE_ABI_VERSION
,
408 static int __init
ocrdma_init_module(void)
412 ocrdma_init_debugfs();
414 status
= be_roce_register_driver(&ocrdma_drv
);
425 static void __exit
ocrdma_exit_module(void)
427 be_roce_unregister_driver(&ocrdma_drv
);
428 ocrdma_rem_debugfs();
/* Hook the entry and exit points into the module loader. */
module_init(ocrdma_init_module);
module_exit(ocrdma_exit_module);