2 * Copyright(c) 2016 - 2018 Intel Corporation.
4 * This file is provided under a dual BSD/GPLv2 license. When using or
5 * redistributing this file, you may do so under either license.
9 * This program is free software; you can redistribute it and/or modify
10 * it under the terms of version 2 of the GNU General Public License as
11 * published by the Free Software Foundation.
13 * This program is distributed in the hope that it will be useful, but
14 * WITHOUT ANY WARRANTY; without even the implied warranty of
15 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
16 * General Public License for more details.
20 * Redistribution and use in source and binary forms, with or without
21 * modification, are permitted provided that the following conditions are met:
24 * - Redistributions of source code must retain the above copyright
25 * notice, this list of conditions and the following disclaimer.
26 * - Redistributions in binary form must reproduce the above copyright
27 * notice, this list of conditions and the following disclaimer in
28 * the documentation and/or other materials provided with the distribution.
30 * - Neither the name of Intel Corporation nor the names of its
31 * contributors may be used to endorse or promote products derived
32 * from this software without specific prior written permission.
34 * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
35 * "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
36 * LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
37 * A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
38 * OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
39 * SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
40 * LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
41 * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
42 * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
43 * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
44 * OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
48 #include <linux/module.h>
49 #include <linux/kernel.h>
50 #include <linux/dma-mapping.h>
55 #define RVT_UVERBS_ABI_VERSION 2
57 MODULE_LICENSE("Dual BSD/GPL");
58 MODULE_DESCRIPTION("RDMA Verbs Transport Library");
/*
 * Module init routine. The visible code calls rvt_driver_cq_init() and logs
 * through pr_err(). The braces, the condition guarding the log and the return
 * statement are not present in this extract.
 * NOTE(review): presumably the message is only logged when ret is non-zero and
 * ret is returned - confirm against the pristine file.
 */
60 static int rvt_init(void)
62 int ret
= rvt_driver_cq_init();
65 pr_err("Error in driver CQ init.\n");
/* Register rvt_init() as this module's init routine. */
69 module_init(rvt_init
);
/*
 * Module exit routine. Its body is not present in this extract, so nothing
 * can be said here about what it tears down.
 */
71 static void rvt_cleanup(void)
/* Register rvt_cleanup() as this module's exit routine. */
75 module_exit(rvt_cleanup
);
78 * rvt_alloc_device - allocate rdi
79 * @size: how big of a structure to allocate
80 * @nports: number of ports to allocate array slots for
82 * Use IB core device alloc to allocate space for the rdi which is assumed to be
83 * inside of the ib_device. Any extra space that drivers require should be included in @size.
86 * We also allocate a port array based on the number of ports.
88 * Return: pointer to allocated rdi
/*
 * Allocates an rvt_dev_info of @size bytes through the IB core and a ports
 * array with @nports slots. Exported for use by other modules.
 * NOTE(review): the NULL checks and return statements of this function are
 * not present in this extract - confirm the failure paths against the
 * pristine file.
 */
90 struct rvt_dev_info
*rvt_alloc_device(size_t size
, int nports
)
92 struct rvt_dev_info
*rdi
;
/*
 * _ib_alloc_device() hands back the ib_device; container_of() recovers the
 * rvt_dev_info that embeds it as its ibdev member.
 */
94 rdi
= container_of(_ib_alloc_device(size
), struct rvt_dev_info
, ibdev
);
/* Zero-filled array holding one rdi->ports element per port. */
98 rdi
->ports
= kcalloc(nports
, sizeof(*rdi
->ports
), GFP_KERNEL
);
/*
 * NOTE(review): presumably only reached when the ports allocation above
 * failed; the guarding condition is missing from this extract.
 */
100 ib_dealloc_device(&rdi
->ibdev
);
104 EXPORT_SYMBOL(rvt_alloc_device
);
107 * rvt_dealloc_device - deallocate rdi
108 * @rdi: structure to free
110 * Free a structure allocated with rvt_alloc_device()
/*
 * Releases the ib_device embedded in @rdi through ib_dealloc_device().
 * Exported for use by other modules.
 * NOTE(review): no release of rdi->ports is visible here, but lines of this
 * function are missing from the extract - confirm against the pristine file.
 */
112 void rvt_dealloc_device(struct rvt_dev_info
*rdi
)
115 ib_dealloc_device(&rdi
->ibdev
);
117 EXPORT_SYMBOL(rvt_dealloc_device
);
/*
 * query_device verb handler: copies the device attributes stored in
 * rdi->dparms.props into @props.
 *
 * @ibdev: IB device being queried
 * @props: destination for the device attributes
 * @uhw:   user data; its inlen/outlen fields are tested below
 *
 * NOTE(review): the return statements are not present in this extract.
 */
119 static int rvt_query_device(struct ib_device
*ibdev
,
120 struct ib_device_attr
*props
,
121 struct ib_udata
*uhw
)
123 struct rvt_dev_info
*rdi
= ib_to_rvt(ibdev
);
/*
 * True when the caller supplied any udata input or output length.
 * NOTE(review): the statement executed in that case is missing from this
 * extract; presumably an error return - confirm.
 */
125 if (uhw
->inlen
|| uhw
->outlen
)
128 * Return rvt_dev_info.dparms.props contents
/* Structure copy of the whole attribute block. */
130 *props
= rdi
->dparms
.props
;
/*
 * modify_device verb handler. Only the signature and part of an explanatory
 * comment survive in this extract; the statements of the body are missing.
 *
 * @device:             IB device
 * @device_modify_mask: mask selecting what to modify
 * @device_modify:      new values
 */
134 static int rvt_modify_device(struct ib_device
*device
,
135 int device_modify_mask
,
136 struct ib_device_modify
*device_modify
)
139 * There is currently no need to supply this based on qib and hfi1.
140 * Future drivers may need to implement this though.
147 * rvt_query_port - Passes the query port call to the driver
148 * @ibdev: Verbs IB dev
149 * @port_num: port number, 1 based from ib core
150 * @props: structure to hold returned properties
152 * Return: 0 on success
/*
 * query_port verb handler: fills part of @props from the rvt_ibport stored
 * for @port_num and then calls the driver's query_port_state() callback,
 * whose result is returned.
 * NOTE(review): original lines 160-163 are absent from this extract;
 * presumably they validate port_index before it indexes rdi->ports - confirm.
 */
154 static int rvt_query_port(struct ib_device
*ibdev
, u8 port_num
,
155 struct ib_port_attr
*props
)
157 struct rvt_dev_info
*rdi
= ib_to_rvt(ibdev
);
158 struct rvt_ibport
*rvp
;
/* Convert the IB core port number into an index into rdi->ports. */
159 int port_index
= ibport_num_to_idx(ibdev
, port_num
);
164 rvp
= rdi
->ports
[port_index
];
165 /* props being zeroed by the caller, avoid zeroing it here */
166 props
->sm_lid
= rvp
->sm_lid
;
167 props
->sm_sl
= rvp
->sm_sl
;
168 props
->port_cap_flags
= rvp
->port_cap_flags
;
/* 0x80000000 is 2^31, i.e. a 2 GiB maximum message size. */
169 props
->max_msg_sz
= 0x80000000;
170 props
->pkey_tbl_len
= rvt_get_npkeys(rdi
);
/* The violation counters kept in the rvt_ibport feed the IB counters. */
171 props
->bad_pkey_cntr
= rvp
->pkey_violations
;
172 props
->qkey_viol_cntr
= rvp
->qkey_violations
;
173 props
->subnet_timeout
= rvp
->subnet_timeout
;
174 props
->init_type_reply
= 0;
176 /* Populate the remaining ib_port_attr elements */
177 return rdi
->driver_f
.query_port_state(rdi
, port_num
, props
);
182 * @ibdev: Verbs IB dev
183 * @port_num: Port number, 1 based from ib core
184 * @port_modify_mask: How to change the port
185 * @props: Structure to fill in
187 * Return: 0 on success
/*
 * modify_port verb handler: applies the set/clear capability masks in @props
 * to the rvt_ibport of @port_num and calls the driver's cap_mask_chg() and
 * shut_down_port() callbacks as selected below.
 * NOTE(review): this extract lacks the declaration of ret (original line
 * 194), original lines 196-199 (presumably a port_index range check), the
 * line between the two mask updates (presumably "} else {") and the final
 * return - confirm against the pristine file.
 */
189 static int rvt_modify_port(struct ib_device
*ibdev
, u8 port_num
,
190 int port_modify_mask
, struct ib_port_modify
*props
)
192 struct rvt_dev_info
*rdi
= ib_to_rvt(ibdev
);
193 struct rvt_ibport
*rvp
;
/* Convert the IB core port number into an index into rdi->ports. */
195 int port_index
= ibport_num_to_idx(ibdev
, port_num
);
200 rvp
= rdi
->ports
[port_index
];
/* With IB_PORT_OPA_MASK_CHG the masks are applied to port_cap3_flags. */
201 if (port_modify_mask
& IB_PORT_OPA_MASK_CHG
) {
202 rvp
->port_cap3_flags
|= props
->set_port_cap_mask
;
203 rvp
->port_cap3_flags
&= ~props
->clr_port_cap_mask
;
/*
 * The same masks applied to port_cap_flags.
 * NOTE(review): presumably the alternative branch of the test above.
 */
205 rvp
->port_cap_flags
|= props
->set_port_cap_mask
;
206 rvp
->port_cap_flags
&= ~props
->clr_port_cap_mask
;
/* Notify the driver only when at least one mask is non-zero. */
209 if (props
->set_port_cap_mask
|| props
->clr_port_cap_mask
)
210 rdi
->driver_f
.cap_mask_chg(rdi
, port_num
);
/* The result of the driver's shut_down_port() callback is kept in ret. */
211 if (port_modify_mask
& IB_PORT_SHUTDOWN
)
212 ret
= rdi
->driver_f
.shut_down_port(rdi
, port_num
);
/* Clear the Q_Key violation counter on request. */
213 if (port_modify_mask
& IB_PORT_RESET_QKEY_CNTR
)
214 rvp
->qkey_violations
= 0;
220 * rvt_query_pkey - Return a pkey from the table at a given index
221 * @ibdev: Verbs IB dev
222 * @port_num: Port number, 1 based from ib core
223 * @index: Index into pkey table
224 * @pkey: returned pkey from the port pkey table
226 * Return: 0 on success, with the pkey stored in @pkey
/*
 * query_pkey verb handler: stores the value of rvt_get_pkey() for the given
 * port index and table index through the pkey pointer.
 * NOTE(review): the end of the parameter list (the pkey output parameter),
 * the declaration of port_index, the statement governed by the range test
 * on index and all return statements are absent from this extract.
 */
228 static int rvt_query_pkey(struct ib_device
*ibdev
, u8 port_num
, u16 index
,
232 * Driver will be responsible for keeping rvt_dev_info.pkey_table up to
233 * date. This function will just return that value. There is no need to
234 * lock, if a stale value is read and sent to the user so be it there is
235 * no way to protect against that anyway.
237 struct rvt_dev_info
*rdi
= ib_to_rvt(ibdev
);
/* Convert the IB core port number into a port index. */
240 port_index
= ibport_num_to_idx(ibdev
, port_num
);
/*
 * index is at or beyond the number of pkeys reported by rvt_get_npkeys().
 * NOTE(review): what happens in that case is not visible here.
 */
244 if (index
>= rvt_get_npkeys(rdi
))
247 *pkey
= rvt_get_pkey(rdi
, port_index
, index
);
252 * rvt_query_gid - Return a gid from the table
253 * @ibdev: Verbs IB dev
254 * @port_num: Port number, 1 based from ib core
255 * @guid_index: Index in table
256 * @gid: Gid to return
258 * Return: 0 on success
/*
 * query_gid verb handler: builds @gid from the gid_prefix stored in the
 * port's rvt_ibport and an interface id obtained from the driver's
 * get_guid_be() callback, whose result is returned.
 * NOTE(review): the declaration of port_index and original lines 273-275
 * (presumably a range check on it) are absent from this extract.
 */
260 static int rvt_query_gid(struct ib_device
*ibdev
, u8 port_num
,
261 int guid_index
, union ib_gid
*gid
)
263 struct rvt_dev_info
*rdi
;
264 struct rvt_ibport
*rvp
;
268 * Driver is responsible for updating the guid table. Which will be used
269 * to craft the return value. This will work similar to how query_pkey()
/* Convert the IB core port number into an index into rdi->ports. */
272 port_index
= ibport_num_to_idx(ibdev
, port_num
);
276 rdi
= ib_to_rvt(ibdev
);
277 rvp
= rdi
->ports
[port_index
];
/* The subnet prefix half of the GID comes from the cached gid_prefix. */
279 gid
->global
.subnet_prefix
= rvp
->gid_prefix
;
/* The driver writes the interface id half directly into @gid. */
281 return rdi
->driver_f
.get_guid_be(rdi
, rvp
, guid_index
,
282 &gid
->global
.interface_id
);
286 * rvt_alloc_ucontext - Allocate a user context
287 * @uctx: Verbs context
288 * @udata: User data allocated
/*
 * alloc_ucontext verb handler. Only the signature survives in this extract;
 * the body is missing, so its return value cannot be stated here.
 */
290 static int rvt_alloc_ucontext(struct ib_ucontext
*uctx
, struct ib_udata
*udata
)
296 * rvt_dealloc_ucontext - Free a user context
297 * @context: Free this
/*
 * dealloc_ucontext verb handler. Only the signature survives in this
 * extract; the body is missing.
 */
299 static void rvt_dealloc_ucontext(struct ib_ucontext
*context
)
/*
 * get_port_immutable verb handler: fills @immutable from the driver
 * parameters in rdi->dparms and from the port attributes returned by
 * ib_query_port().
 * NOTE(review): the declarations of err and port_index, the checks on
 * port_index and err, and the return statements are absent from this
 * extract.
 */
304 static int rvt_get_port_immutable(struct ib_device
*ibdev
, u8 port_num
,
305 struct ib_port_immutable
*immutable
)
307 struct rvt_dev_info
*rdi
= ib_to_rvt(ibdev
);
308 struct ib_port_attr attr
;
/* Convert the IB core port number into a port index. */
311 port_index
= ibport_num_to_idx(ibdev
, port_num
);
315 immutable
->core_cap_flags
= rdi
->dparms
.core_cap_flags
;
/* Table lengths are taken from a fresh port query. */
317 err
= ib_query_port(ibdev
, port_num
, &attr
);
321 immutable
->pkey_tbl_len
= attr
.pkey_tbl_len
;
322 immutable
->gid_tbl_len
= attr
.gid_tbl_len
;
323 immutable
->max_mad_size
= rdi
->dparms
.max_mad_size
;
373 _VERB_IDX_MAX
/* Must always be last! */
/*
 * Verbs operation table that rvt_register_device() installs on the
 * ib_device through ib_set_device_ops().
 * NOTE(review): the initializers on original lines 378 and 399 and the
 * closing brace are absent from this extract.
 */
376 static const struct ib_device_ops rvt_dev_ops
= {
377 .uverbs_abi_ver
= RVT_UVERBS_ABI_VERSION
,
379 .alloc_mr
= rvt_alloc_mr
,
380 .alloc_pd
= rvt_alloc_pd
,
381 .alloc_ucontext
= rvt_alloc_ucontext
,
382 .attach_mcast
= rvt_attach_mcast
,
383 .create_ah
= rvt_create_ah
,
384 .create_cq
= rvt_create_cq
,
385 .create_qp
= rvt_create_qp
,
386 .create_srq
= rvt_create_srq
,
/* User and kernel address handles share rvt_create_ah(). */
387 .create_user_ah
= rvt_create_ah
,
388 .dealloc_pd
= rvt_dealloc_pd
,
389 .dealloc_ucontext
= rvt_dealloc_ucontext
,
390 .dereg_mr
= rvt_dereg_mr
,
391 .destroy_ah
= rvt_destroy_ah
,
392 .destroy_cq
= rvt_destroy_cq
,
393 .destroy_qp
= rvt_destroy_qp
,
394 .destroy_srq
= rvt_destroy_srq
,
395 .detach_mcast
= rvt_detach_mcast
,
396 .get_dma_mr
= rvt_get_dma_mr
,
397 .get_port_immutable
= rvt_get_port_immutable
,
398 .map_mr_sg
= rvt_map_mr_sg
,
400 .modify_ah
= rvt_modify_ah
,
401 .modify_device
= rvt_modify_device
,
402 .modify_port
= rvt_modify_port
,
403 .modify_qp
= rvt_modify_qp
,
404 .modify_srq
= rvt_modify_srq
,
405 .poll_cq
= rvt_poll_cq
,
406 .post_recv
= rvt_post_recv
,
407 .post_send
= rvt_post_send
,
408 .post_srq_recv
= rvt_post_srq_recv
,
409 .query_ah
= rvt_query_ah
,
410 .query_device
= rvt_query_device
,
411 .query_gid
= rvt_query_gid
,
412 .query_pkey
= rvt_query_pkey
,
413 .query_port
= rvt_query_port
,
414 .query_qp
= rvt_query_qp
,
415 .query_srq
= rvt_query_srq
,
416 .reg_user_mr
= rvt_reg_user_mr
,
417 .req_notify_cq
= rvt_req_notify_cq
,
418 .resize_cq
= rvt_resize_cq
,
/*
 * Each entry names a core object, the rvt structure that embeds it and the
 * embedding member. NOTE(review): presumably this lets the IB core size its
 * allocations for the rvt structure - confirm against INIT_RDMA_OBJ_SIZE.
 */
420 INIT_RDMA_OBJ_SIZE(ib_ah
, rvt_ah
, ibah
),
421 INIT_RDMA_OBJ_SIZE(ib_cq
, rvt_cq
, ibcq
),
422 INIT_RDMA_OBJ_SIZE(ib_pd
, rvt_pd
, ibpd
),
423 INIT_RDMA_OBJ_SIZE(ib_srq
, rvt_srq
, ibsrq
),
424 INIT_RDMA_OBJ_SIZE(ib_ucontext
, rvt_ucontext
, ibucontext
),
/*
 * Tests whether the driver callbacks needed for the verb index @verb are
 * present in @rdi. Called by rvt_register_device() for every index below
 * _VERB_IDX_MAX; a non-zero result is treated there as "requirement not met".
 *
 * Every test below has the same shape: when the driver left an ib_device
 * op unset, the driver_f helpers needed for that op are tested for NULL.
 *
 * NOTE(review): the switch/case labels, braces and return statements are
 * absent from this extract, so which test belongs to which verb index and
 * which value is returned cannot be confirmed from here. The extract also
 * stops partway through the post_send test.
 */
427 static noinline
int check_support(struct rvt_dev_info
*rdi
, int verb
)
432 * These functions are not part of verbs specifically but are
433 * required for rdmavt to function.
/* True when either ops.init_port or driver_f.get_pci_dev is unset. */
435 if ((!rdi
->ibdev
.ops
.init_port
) ||
436 (!rdi
->driver_f
.get_pci_dev
))
442 * rdmavt does not support modify device currently drivers must
445 if (!rdi
->ibdev
.ops
.modify_device
)
/* query_port: needs the driver's query_port_state helper. */
450 if (!rdi
->ibdev
.ops
.query_port
)
451 if (!rdi
->driver_f
.query_port_state
)
/* modify_port: needs cap_mask_chg and shut_down_port. */
456 if (!rdi
->ibdev
.ops
.modify_port
)
457 if (!rdi
->driver_f
.cap_mask_chg
||
458 !rdi
->driver_f
.shut_down_port
)
/* query_gid: needs get_guid_be. */
463 if (!rdi
->ibdev
.ops
.query_gid
)
464 if (!rdi
->driver_f
.get_guid_be
)
/* create_qp: needs the QP private alloc/free and quiescing helpers. */
469 if (!rdi
->ibdev
.ops
.create_qp
)
470 if (!rdi
->driver_f
.qp_priv_alloc
||
471 !rdi
->driver_f
.qp_priv_free
||
472 !rdi
->driver_f
.notify_qp_reset
||
473 !rdi
->driver_f
.flush_qp_waiters
||
474 !rdi
->driver_f
.stop_send_queue
||
475 !rdi
->driver_f
.quiesce_qp
)
/* modify_qp: needs the quiescing helpers plus send-scheduling and MTU helpers. */
480 if (!rdi
->ibdev
.ops
.modify_qp
)
481 if (!rdi
->driver_f
.notify_qp_reset
||
482 !rdi
->driver_f
.schedule_send
||
483 !rdi
->driver_f
.get_pmtu_from_attr
||
484 !rdi
->driver_f
.flush_qp_waiters
||
485 !rdi
->driver_f
.stop_send_queue
||
486 !rdi
->driver_f
.quiesce_qp
||
487 !rdi
->driver_f
.notify_error_qp
||
488 !rdi
->driver_f
.mtu_from_qp
||
489 !rdi
->driver_f
.mtu_to_path_mtu
)
/* destroy_qp: needs qp_priv_free and the quiescing helpers. */
494 if (!rdi
->ibdev
.ops
.destroy_qp
)
495 if (!rdi
->driver_f
.qp_priv_free
||
496 !rdi
->driver_f
.notify_qp_reset
||
497 !rdi
->driver_f
.flush_qp_waiters
||
498 !rdi
->driver_f
.stop_send_queue
||
499 !rdi
->driver_f
.quiesce_qp
)
/* post_send: needs schedule_send and do_send; the rest of this test is cut off. */
504 if (!rdi
->ibdev
.ops
.post_send
)
505 if (!rdi
->driver_f
.schedule_send
||
506 !rdi
->driver_f
.do_send
||
517 * rvt_register_device - register a driver
518 * @rdi: main dev structure for all of rdmavt operations
520 * It is up to drivers to allocate the rdi and fill in the appropriate information.
523 * Return: 0 on success otherwise an errno.
/*
 * Registers @rdi with rdmavt and the IB core. Visible steps, in order:
 * check driver support for every verb index, install rvt_dev_ops, initialise
 * the QP, SRQ, multicast, MR and WSS sub-systems and the AH/CQ/PD locks and
 * counters, set rdmavt-owned ib_device fields, call ib_register_device() and
 * create the MAD agents. Exported for use by other modules.
 * NOTE(review): local declarations, the "if (ret)" guards in front of the
 * error messages, the error-unwind code (original lines 612-623) and all
 * return statements are absent from this extract.
 */
525 int rvt_register_device(struct rvt_dev_info
*rdi
)
533 * Check to ensure drivers have setup the required helpers for the verbs
534 * they want rdmavt to handle
/* Walk every verb index; a non-zero check_support() result is logged. */
536 for (i
= 0; i
< _VERB_IDX_MAX
; i
++)
537 if (check_support(rdi
, i
)) {
538 pr_err("Driver support req not met at %d\n", i
);
/* Install the rdmavt verb implementations on the ib_device. */
542 ib_set_device_ops(&rdi
->ibdev
, &rvt_dev_ops
);
544 /* Once we get past here we can use rvt_pr macros and tracepoints */
545 trace_rvt_dbg(rdi
, "Driver attempting registration");
/* Queue pairs */
549 ret
= rvt_driver_qp_init(rdi
);
551 pr_err("Error in driver QP init.\n");
/* Address handles: lock and allocation counter */
556 spin_lock_init(&rdi
->n_ahs_lock
);
557 rdi
->n_ahs_allocated
= 0;
559 /* Shared Receive Queue */
560 rvt_driver_srq_init(rdi
);
/* Multicast */
563 rvt_driver_mcast_init(rdi
);
/* Memory regions */
566 ret
= rvt_driver_mr_init(rdi
);
568 pr_err("Error in driver MR init.\n");
572 /* Memory Working Set Size */
573 ret
= rvt_wss_init(rdi
);
575 rvt_pr_err(rdi
, "Error in WSS init.\n");
579 /* Completion queues */
580 spin_lock_init(&rdi
->n_cqs_lock
);
582 /* Protection Domain */
583 spin_lock_init(&rdi
->n_pds_lock
);
584 rdi
->n_pds_allocated
= 0;
587 * There are some things which could be set by underlying drivers but
588 * really should be up to rdmavt to set. For instance drivers can't know
589 * exactly which functions rdmavt supports, nor do they know the ABI
590 * version, so we do all of this sort of stuff here.
/* OR-in the user verbs commands listed here; bits set by the driver are kept. */
592 rdi
->ibdev
.uverbs_cmd_mask
|=
593 (1ull << IB_USER_VERBS_CMD_POLL_CQ
) |
594 (1ull << IB_USER_VERBS_CMD_REQ_NOTIFY_CQ
) |
595 (1ull << IB_USER_VERBS_CMD_POST_SEND
) |
596 (1ull << IB_USER_VERBS_CMD_POST_RECV
) |
597 (1ull << IB_USER_VERBS_CMD_POST_SRQ_RECV
);
598 rdi
->ibdev
.node_type
= RDMA_NODE_IB_CA
;
/* Default to one completion vector when the driver set none. */
599 if (!rdi
->ibdev
.num_comp_vectors
)
600 rdi
->ibdev
.num_comp_vectors
= 1;
602 /* We are now good to announce we exist */
603 ret
= ib_register_device(&rdi
->ibdev
, dev_name(&rdi
->ibdev
.dev
), NULL
);
605 rvt_pr_err(rdi
, "Failed to register driver with ib core.\n");
609 rvt_create_mad_agents(rdi
);
611 rvt_pr_info(rdi
, "Registration with rdmavt done.\n");
624 EXPORT_SYMBOL(rvt_register_device
);
627 * rvt_unregister_device - remove a driver
628 * @rdi: rvt dev struct
/*
 * Unregisters @rdi: frees the MAD agents and then unregisters the ib_device
 * from the IB core. Exported for use by other modules.
 * NOTE(review): original lines 633-635 and 639-642 are absent from this
 * extract, so further teardown steps may exist - confirm.
 */
630 void rvt_unregister_device(struct rvt_dev_info
*rdi
)
632 trace_rvt_dbg(rdi
, "Driver is unregistering.");
636 rvt_free_mad_agents(rdi
);
638 ib_unregister_device(&rdi
->ibdev
);
643 EXPORT_SYMBOL(rvt_unregister_device
);
646 * rvt_init_port - init internal data for driver port
647 * @rdi: rvt_dev_info struct
649 * @port_index: 0 based index of ports, different from IB core port num
650 * @pkey_table: pkey_table for @port
652 * Keep track of a list of ports. No need to have a detach port.
653 * They persist until the driver goes away.
/*
 * Records @port in slot @port_index of rdi->ports and attaches @pkey_table
 * to it. Exported for use by other modules.
 * NOTE(review): no bounds check on @port_index is visible and the return
 * statement is absent from this extract.
 */
657 int rvt_init_port(struct rvt_dev_info
*rdi
, struct rvt_ibport
*port
,
658 int port_index
, u16
*pkey_table
)
661 rdi
->ports
[port_index
] = port
;
/* Same object as @port, reached through the slot just written. */
662 rdi
->ports
[port_index
]->pkey_table
= pkey_table
;
666 EXPORT_SYMBOL(rvt_init_port
);