/*
 * Copyright (c) 2005 Ammasso, Inc. All rights reserved.
 * Copyright (c) 2005 Open Grid Computing, Inc. All rights reserved.
 *
 * This software is available to you under a choice of one of two
 * licenses.  You may choose to be licensed under the terms of the GNU
 * General Public License (GPL) Version 2, available from the file
 * COPYING in the main directory of this source tree, or the
 * OpenIB.org BSD license below:
 *
 *     Redistribution and use in source and binary forms, with or
 *     without modification, are permitted provided that the following
 *     conditions are met:
 *
 *      - Redistributions of source code must retain the above
 *        copyright notice, this list of conditions and the following
 *        disclaimer.
 *
 *      - Redistributions in binary form must reproduce the above
 *        copyright notice, this list of conditions and the following
 *        disclaimer in the documentation and/or other materials
 *        provided with the distribution.
 *
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
 * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
 * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
 * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS
 * BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN
 * ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN
 * CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
 * SOFTWARE.
 */
36 #include <linux/module.h>
37 #include <linux/moduleparam.h>
38 #include <linux/pci.h>
39 #include <linux/netdevice.h>
40 #include <linux/etherdevice.h>
41 #include <linux/delay.h>
42 #include <linux/ethtool.h>
43 #include <linux/mii.h>
44 #include <linux/if_vlan.h>
45 #include <linux/crc32.h>
48 #include <linux/tcp.h>
49 #include <linux/init.h>
50 #include <linux/dma-mapping.h>
52 #include <linux/inet.h>
53 #include <linux/vmalloc.h>
54 #include <linux/slab.h>
56 #include <linux/route.h>
60 #include <asm/byteorder.h>
61 #include <rdma/ib_smi.h>
/*
 * Device capabilities.
 *
 * C2_MAX_QP_WR is derived from a 128 KiB budget divided by the maximum
 * work-queue-element size.
 *
 * NOTE(review): C2_MAX_SGES is used by c2_rnic_query() but its definition
 * was absent from the damaged listing this file was recovered from; 4 is
 * believed to be the upstream amso1100 value -- confirm.
 */
#define C2_MIN_PAGESIZE  1024

#define C2_MAX_MRS       32768
#define C2_MAX_QPS       16000
#define C2_MAX_WQE_SZ    256
#define C2_MAX_QP_WR     ((128*1024)/C2_MAX_WQE_SZ)
#define C2_MAX_SGES      4
#define C2_MAX_SGE_RD    1
#define C2_MAX_CQS       32768
#define C2_MAX_CQES      4096
#define C2_MAX_PDS       16384
79 * Send the adapter INIT message to the amso1100
81 static int c2_adapter_init(struct c2_dev
*c2dev
)
83 struct c2wr_init_req wr
;
86 memset(&wr
, 0, sizeof(wr
));
87 c2_wr_set_id(&wr
, CCWR_INIT
);
89 wr
.hint_count
= cpu_to_be64(c2dev
->hint_count_dma
);
90 wr
.q0_host_shared
= cpu_to_be64(c2dev
->req_vq
.shared_dma
);
91 wr
.q1_host_shared
= cpu_to_be64(c2dev
->rep_vq
.shared_dma
);
92 wr
.q1_host_msg_pool
= cpu_to_be64(c2dev
->rep_vq
.host_dma
);
93 wr
.q2_host_shared
= cpu_to_be64(c2dev
->aeq
.shared_dma
);
94 wr
.q2_host_msg_pool
= cpu_to_be64(c2dev
->aeq
.host_dma
);
96 /* Post the init message */
97 err
= vq_send_wr(c2dev
, (union c2wr
*) & wr
);
103 * Send the adapter TERM message to the amso1100
105 static void c2_adapter_term(struct c2_dev
*c2dev
)
107 struct c2wr_init_req wr
;
109 memset(&wr
, 0, sizeof(wr
));
110 c2_wr_set_id(&wr
, CCWR_TERM
);
113 /* Post the init message */
114 vq_send_wr(c2dev
, (union c2wr
*) & wr
);
123 static int c2_rnic_query(struct c2_dev
*c2dev
, struct ib_device_attr
*props
)
125 struct c2_vq_req
*vq_req
;
126 struct c2wr_rnic_query_req wr
;
127 struct c2wr_rnic_query_rep
*reply
;
130 vq_req
= vq_req_alloc(c2dev
);
134 c2_wr_set_id(&wr
, CCWR_RNIC_QUERY
);
135 wr
.hdr
.context
= (unsigned long) vq_req
;
136 wr
.rnic_handle
= c2dev
->adapter_handle
;
138 vq_req_get(c2dev
, vq_req
);
140 err
= vq_send_wr(c2dev
, (union c2wr
*) &wr
);
142 vq_req_put(c2dev
, vq_req
);
146 err
= vq_wait_for_reply(c2dev
, vq_req
);
151 (struct c2wr_rnic_query_rep
*) (unsigned long) (vq_req
->reply_msg
);
155 err
= c2_errno(reply
);
160 ((u64
)be32_to_cpu(reply
->fw_ver_major
) << 32) |
161 ((be32_to_cpu(reply
->fw_ver_minor
) & 0xFFFF) << 16) |
162 (be32_to_cpu(reply
->fw_ver_patch
) & 0xFFFF);
163 memcpy(&props
->sys_image_guid
, c2dev
->netdev
->dev_addr
, 6);
164 props
->max_mr_size
= 0xFFFFFFFF;
165 props
->page_size_cap
= ~(C2_MIN_PAGESIZE
-1);
166 props
->vendor_id
= be32_to_cpu(reply
->vendor_id
);
167 props
->vendor_part_id
= be32_to_cpu(reply
->part_number
);
168 props
->hw_ver
= be32_to_cpu(reply
->hw_version
);
169 props
->max_qp
= be32_to_cpu(reply
->max_qps
);
170 props
->max_qp_wr
= be32_to_cpu(reply
->max_qp_depth
);
171 props
->device_cap_flags
= c2dev
->device_cap_flags
;
172 props
->max_sge
= C2_MAX_SGES
;
173 props
->max_sge_rd
= C2_MAX_SGE_RD
;
174 props
->max_cq
= be32_to_cpu(reply
->max_cqs
);
175 props
->max_cqe
= be32_to_cpu(reply
->max_cq_depth
);
176 props
->max_mr
= be32_to_cpu(reply
->max_mrs
);
177 props
->max_pd
= be32_to_cpu(reply
->max_pds
);
178 props
->max_qp_rd_atom
= be32_to_cpu(reply
->max_qp_ird
);
179 props
->max_ee_rd_atom
= 0;
180 props
->max_res_rd_atom
= be32_to_cpu(reply
->max_global_ird
);
181 props
->max_qp_init_rd_atom
= be32_to_cpu(reply
->max_qp_ord
);
182 props
->max_ee_init_rd_atom
= 0;
183 props
->atomic_cap
= IB_ATOMIC_NONE
;
186 props
->max_mw
= be32_to_cpu(reply
->max_mws
);
187 props
->max_raw_ipv6_qp
= 0;
188 props
->max_raw_ethy_qp
= 0;
189 props
->max_mcast_grp
= 0;
190 props
->max_mcast_qp_attach
= 0;
191 props
->max_total_mcast_qp_attach
= 0;
194 props
->max_map_per_fmr
= 0;
196 props
->max_srq_wr
= 0;
197 props
->max_srq_sge
= 0;
198 props
->max_pkeys
= 0;
199 props
->local_ca_ack_delay
= 0;
202 vq_repbuf_free(c2dev
, reply
);
205 vq_req_free(c2dev
, vq_req
);
210 * Add an IP address to the RNIC interface
212 int c2_add_addr(struct c2_dev
*c2dev
, __be32 inaddr
, __be32 inmask
)
214 struct c2_vq_req
*vq_req
;
215 struct c2wr_rnic_setconfig_req
*wr
;
216 struct c2wr_rnic_setconfig_rep
*reply
;
217 struct c2_netaddr netaddr
;
220 vq_req
= vq_req_alloc(c2dev
);
224 len
= sizeof(struct c2_netaddr
);
225 wr
= kmalloc(c2dev
->req_vq
.msg_size
, GFP_KERNEL
);
231 c2_wr_set_id(wr
, CCWR_RNIC_SETCONFIG
);
232 wr
->hdr
.context
= (unsigned long) vq_req
;
233 wr
->rnic_handle
= c2dev
->adapter_handle
;
234 wr
->option
= cpu_to_be32(C2_CFG_ADD_ADDR
);
236 netaddr
.ip_addr
= inaddr
;
237 netaddr
.netmask
= inmask
;
240 memcpy(wr
->data
, &netaddr
, len
);
242 vq_req_get(c2dev
, vq_req
);
244 err
= vq_send_wr(c2dev
, (union c2wr
*) wr
);
246 vq_req_put(c2dev
, vq_req
);
250 err
= vq_wait_for_reply(c2dev
, vq_req
);
255 (struct c2wr_rnic_setconfig_rep
*) (unsigned long) (vq_req
->reply_msg
);
261 err
= c2_errno(reply
);
262 vq_repbuf_free(c2dev
, reply
);
267 vq_req_free(c2dev
, vq_req
);
272 * Delete an IP address from the RNIC interface
274 int c2_del_addr(struct c2_dev
*c2dev
, __be32 inaddr
, __be32 inmask
)
276 struct c2_vq_req
*vq_req
;
277 struct c2wr_rnic_setconfig_req
*wr
;
278 struct c2wr_rnic_setconfig_rep
*reply
;
279 struct c2_netaddr netaddr
;
282 vq_req
= vq_req_alloc(c2dev
);
286 len
= sizeof(struct c2_netaddr
);
287 wr
= kmalloc(c2dev
->req_vq
.msg_size
, GFP_KERNEL
);
293 c2_wr_set_id(wr
, CCWR_RNIC_SETCONFIG
);
294 wr
->hdr
.context
= (unsigned long) vq_req
;
295 wr
->rnic_handle
= c2dev
->adapter_handle
;
296 wr
->option
= cpu_to_be32(C2_CFG_DEL_ADDR
);
298 netaddr
.ip_addr
= inaddr
;
299 netaddr
.netmask
= inmask
;
302 memcpy(wr
->data
, &netaddr
, len
);
304 vq_req_get(c2dev
, vq_req
);
306 err
= vq_send_wr(c2dev
, (union c2wr
*) wr
);
308 vq_req_put(c2dev
, vq_req
);
312 err
= vq_wait_for_reply(c2dev
, vq_req
);
317 (struct c2wr_rnic_setconfig_rep
*) (unsigned long) (vq_req
->reply_msg
);
323 err
= c2_errno(reply
);
324 vq_repbuf_free(c2dev
, reply
);
329 vq_req_free(c2dev
, vq_req
);
334 * Open a single RNIC instance to use with all
335 * low level openib calls
337 static int c2_rnic_open(struct c2_dev
*c2dev
)
339 struct c2_vq_req
*vq_req
;
341 struct c2wr_rnic_open_rep
*reply
;
344 vq_req
= vq_req_alloc(c2dev
);
345 if (vq_req
== NULL
) {
349 memset(&wr
, 0, sizeof(wr
));
350 c2_wr_set_id(&wr
, CCWR_RNIC_OPEN
);
351 wr
.rnic_open
.req
.hdr
.context
= (unsigned long) (vq_req
);
352 wr
.rnic_open
.req
.flags
= cpu_to_be16(RNIC_PRIV_MODE
);
353 wr
.rnic_open
.req
.port_num
= cpu_to_be16(0);
354 wr
.rnic_open
.req
.user_context
= (unsigned long) c2dev
;
356 vq_req_get(c2dev
, vq_req
);
358 err
= vq_send_wr(c2dev
, &wr
);
360 vq_req_put(c2dev
, vq_req
);
364 err
= vq_wait_for_reply(c2dev
, vq_req
);
369 reply
= (struct c2wr_rnic_open_rep
*) (unsigned long) (vq_req
->reply_msg
);
375 if ((err
= c2_errno(reply
)) != 0) {
379 c2dev
->adapter_handle
= reply
->rnic_handle
;
382 vq_repbuf_free(c2dev
, reply
);
384 vq_req_free(c2dev
, vq_req
);
389 * Close the RNIC instance
391 static int c2_rnic_close(struct c2_dev
*c2dev
)
393 struct c2_vq_req
*vq_req
;
395 struct c2wr_rnic_close_rep
*reply
;
398 vq_req
= vq_req_alloc(c2dev
);
399 if (vq_req
== NULL
) {
403 memset(&wr
, 0, sizeof(wr
));
404 c2_wr_set_id(&wr
, CCWR_RNIC_CLOSE
);
405 wr
.rnic_close
.req
.hdr
.context
= (unsigned long) vq_req
;
406 wr
.rnic_close
.req
.rnic_handle
= c2dev
->adapter_handle
;
408 vq_req_get(c2dev
, vq_req
);
410 err
= vq_send_wr(c2dev
, &wr
);
412 vq_req_put(c2dev
, vq_req
);
416 err
= vq_wait_for_reply(c2dev
, vq_req
);
421 reply
= (struct c2wr_rnic_close_rep
*) (unsigned long) (vq_req
->reply_msg
);
427 if ((err
= c2_errno(reply
)) != 0) {
431 c2dev
->adapter_handle
= 0;
434 vq_repbuf_free(c2dev
, reply
);
436 vq_req_free(c2dev
, vq_req
);
441 * Called by c2_probe to initialize the RNIC. This principally
442 * involves initializing the various limits and resource pools that
443 * comprise the RNIC instance.
445 int c2_rnic_init(struct c2_dev
*c2dev
)
451 void __iomem
*mmio_regs
;
453 /* Device capabilities */
454 c2dev
->device_cap_flags
=
455 (IB_DEVICE_RESIZE_MAX_WR
|
456 IB_DEVICE_CURR_QP_STATE_MOD
|
457 IB_DEVICE_SYS_IMAGE_GUID
|
458 IB_DEVICE_LOCAL_DMA_LKEY
|
459 IB_DEVICE_MEM_WINDOW
);
461 /* Allocate the qptr_array */
462 c2dev
->qptr_array
= vzalloc(C2_MAX_CQS
* sizeof(void *));
463 if (!c2dev
->qptr_array
) {
467 /* Initialize the qptr_array */
468 c2dev
->qptr_array
[0] = (void *) &c2dev
->req_vq
;
469 c2dev
->qptr_array
[1] = (void *) &c2dev
->rep_vq
;
470 c2dev
->qptr_array
[2] = (void *) &c2dev
->aeq
;
472 /* Initialize data structures */
473 init_waitqueue_head(&c2dev
->req_vq_wo
);
474 spin_lock_init(&c2dev
->vqlock
);
475 spin_lock_init(&c2dev
->lock
);
477 /* Allocate MQ shared pointer pool for kernel clients. User
478 * mode client pools are hung off the user context
480 err
= c2_init_mqsp_pool(c2dev
, GFP_KERNEL
, &c2dev
->kern_mqsp_pool
);
485 /* Allocate shared pointers for Q0, Q1, and Q2 from
486 * the shared pointer pool.
489 c2dev
->hint_count
= c2_alloc_mqsp(c2dev
, c2dev
->kern_mqsp_pool
,
490 &c2dev
->hint_count_dma
,
492 c2dev
->req_vq
.shared
= c2_alloc_mqsp(c2dev
, c2dev
->kern_mqsp_pool
,
493 &c2dev
->req_vq
.shared_dma
,
495 c2dev
->rep_vq
.shared
= c2_alloc_mqsp(c2dev
, c2dev
->kern_mqsp_pool
,
496 &c2dev
->rep_vq
.shared_dma
,
498 c2dev
->aeq
.shared
= c2_alloc_mqsp(c2dev
, c2dev
->kern_mqsp_pool
,
499 &c2dev
->aeq
.shared_dma
, GFP_KERNEL
);
500 if (!c2dev
->hint_count
|| !c2dev
->req_vq
.shared
||
501 !c2dev
->rep_vq
.shared
|| !c2dev
->aeq
.shared
) {
506 mmio_regs
= c2dev
->kva
;
507 /* Initialize the Verbs Request Queue */
508 c2_mq_req_init(&c2dev
->req_vq
, 0,
509 be32_to_cpu((__force __be32
) readl(mmio_regs
+ C2_REGS_Q0_QSIZE
)),
510 be32_to_cpu((__force __be32
) readl(mmio_regs
+ C2_REGS_Q0_MSGSIZE
)),
512 be32_to_cpu((__force __be32
) readl(mmio_regs
+ C2_REGS_Q0_POOLSTART
)),
514 be32_to_cpu((__force __be32
) readl(mmio_regs
+ C2_REGS_Q0_SHARED
)),
515 C2_MQ_ADAPTER_TARGET
);
517 /* Initialize the Verbs Reply Queue */
518 qsize
= be32_to_cpu((__force __be32
) readl(mmio_regs
+ C2_REGS_Q1_QSIZE
));
519 msgsize
= be32_to_cpu((__force __be32
) readl(mmio_regs
+ C2_REGS_Q1_MSGSIZE
));
520 q1_pages
= dma_alloc_coherent(&c2dev
->pcidev
->dev
, qsize
* msgsize
,
521 &c2dev
->rep_vq
.host_dma
, GFP_KERNEL
);
526 dma_unmap_addr_set(&c2dev
->rep_vq
, mapping
, c2dev
->rep_vq
.host_dma
);
527 pr_debug("%s rep_vq va %p dma %llx\n", __func__
, q1_pages
,
528 (unsigned long long) c2dev
->rep_vq
.host_dma
);
529 c2_mq_rep_init(&c2dev
->rep_vq
,
535 be32_to_cpu((__force __be32
) readl(mmio_regs
+ C2_REGS_Q1_SHARED
)),
538 /* Initialize the Asynchronus Event Queue */
539 qsize
= be32_to_cpu((__force __be32
) readl(mmio_regs
+ C2_REGS_Q2_QSIZE
));
540 msgsize
= be32_to_cpu((__force __be32
) readl(mmio_regs
+ C2_REGS_Q2_MSGSIZE
));
541 q2_pages
= dma_alloc_coherent(&c2dev
->pcidev
->dev
, qsize
* msgsize
,
542 &c2dev
->aeq
.host_dma
, GFP_KERNEL
);
547 dma_unmap_addr_set(&c2dev
->aeq
, mapping
, c2dev
->aeq
.host_dma
);
548 pr_debug("%s aeq va %p dma %llx\n", __func__
, q2_pages
,
549 (unsigned long long) c2dev
->aeq
.host_dma
);
550 c2_mq_rep_init(&c2dev
->aeq
,
556 be32_to_cpu((__force __be32
) readl(mmio_regs
+ C2_REGS_Q2_SHARED
)),
559 /* Initialize the verbs request allocator */
560 err
= vq_init(c2dev
);
564 /* Enable interrupts on the adapter */
565 writel(0, c2dev
->regs
+ C2_IDIS
);
567 /* create the WR init message */
568 err
= c2_adapter_init(c2dev
);
573 /* open an adapter instance */
574 err
= c2_rnic_open(c2dev
);
578 /* Initialize cached the adapter limits */
579 if (c2_rnic_query(c2dev
, &c2dev
->props
))
582 /* Initialize the PD pool */
583 err
= c2_init_pd_table(c2dev
);
587 /* Initialize the QP pool */
588 c2_init_qp_table(c2dev
);
592 c2_rnic_close(c2dev
);
596 dma_free_coherent(&c2dev
->pcidev
->dev
,
597 c2dev
->aeq
.q_size
* c2dev
->aeq
.msg_size
,
598 q2_pages
, dma_unmap_addr(&c2dev
->aeq
, mapping
));
600 dma_free_coherent(&c2dev
->pcidev
->dev
,
601 c2dev
->rep_vq
.q_size
* c2dev
->rep_vq
.msg_size
,
602 q1_pages
, dma_unmap_addr(&c2dev
->rep_vq
, mapping
));
604 c2_free_mqsp_pool(c2dev
, c2dev
->kern_mqsp_pool
);
606 vfree(c2dev
->qptr_array
);
612 * Called by c2_remove to cleanup the RNIC resources.
614 void c2_rnic_term(struct c2_dev
*c2dev
)
617 /* Close the open adapter instance */
618 c2_rnic_close(c2dev
);
620 /* Send the TERM message to the adapter */
621 c2_adapter_term(c2dev
);
623 /* Disable interrupts on the adapter */
624 writel(1, c2dev
->regs
+ C2_IDIS
);
626 /* Free the QP pool */
627 c2_cleanup_qp_table(c2dev
);
629 /* Free the PD pool */
630 c2_cleanup_pd_table(c2dev
);
632 /* Free the verbs request allocator */
635 /* Free the asynchronus event queue */
636 dma_free_coherent(&c2dev
->pcidev
->dev
,
637 c2dev
->aeq
.q_size
* c2dev
->aeq
.msg_size
,
638 c2dev
->aeq
.msg_pool
.host
,
639 dma_unmap_addr(&c2dev
->aeq
, mapping
));
641 /* Free the verbs reply queue */
642 dma_free_coherent(&c2dev
->pcidev
->dev
,
643 c2dev
->rep_vq
.q_size
* c2dev
->rep_vq
.msg_size
,
644 c2dev
->rep_vq
.msg_pool
.host
,
645 dma_unmap_addr(&c2dev
->rep_vq
, mapping
));
647 /* Free the MQ shared pointer pool */
648 c2_free_mqsp_pool(c2dev
, c2dev
->kern_mqsp_pool
);
650 /* Free the qptr_array */
651 vfree(c2dev
->qptr_array
);