2 * Copyright (c) 2006 Chelsio, Inc. All rights reserved.
4 * This software is available to you under a choice of one of two
5 * licenses. You may choose to be licensed under the terms of the GNU
6 * General Public License (GPL) Version 2, available from the file
7 * COPYING in the main directory of this source tree, or the
8 * OpenIB.org BSD license below:
10 * Redistribution and use in source and binary forms, with or
11 * without modification, are permitted provided that the following
14 * - Redistributions of source code must retain the above
15 * copyright notice, this list of conditions and the following
18 * - Redistributions in binary form must reproduce the above
19 * copyright notice, this list of conditions and the following
20 * disclaimer in the documentation and/or other materials
21 * provided with the distribution.
23 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
24 * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
25 * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
26 * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS
27 * BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN
28 * ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN
29 * CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
32 #include <linux/module.h>
33 #include <linux/moduleparam.h>
34 #include <linux/device.h>
35 #include <linux/netdevice.h>
36 #include <linux/etherdevice.h>
37 #include <linux/delay.h>
38 #include <linux/errno.h>
39 #include <linux/list.h>
40 #include <linux/spinlock.h>
41 #include <linux/ethtool.h>
42 #include <linux/rtnetlink.h>
46 #include <asm/byteorder.h>
48 #include <rdma/iw_cm.h>
49 #include <rdma/ib_verbs.h>
50 #include <rdma/ib_smi.h>
51 #include <rdma/ib_umem.h>
52 #include <rdma/ib_user_verbs.h>
56 #include "iwch_provider.h"
58 #include "iwch_user.h"
60 static int iwch_modify_port(struct ib_device
*ibdev
,
61 u8 port
, int port_modify_mask
,
62 struct ib_port_modify
*props
)
67 static struct ib_ah
*iwch_ah_create(struct ib_pd
*pd
,
68 struct ib_ah_attr
*ah_attr
)
70 return ERR_PTR(-ENOSYS
);
73 static int iwch_ah_destroy(struct ib_ah
*ah
)
78 static int iwch_multicast_attach(struct ib_qp
*ibqp
, union ib_gid
*gid
, u16 lid
)
83 static int iwch_multicast_detach(struct ib_qp
*ibqp
, union ib_gid
*gid
, u16 lid
)
88 static int iwch_process_mad(struct ib_device
*ibdev
,
92 struct ib_grh
*in_grh
,
93 struct ib_mad
*in_mad
, struct ib_mad
*out_mad
)
98 static int iwch_dealloc_ucontext(struct ib_ucontext
*context
)
100 struct iwch_dev
*rhp
= to_iwch_dev(context
->device
);
101 struct iwch_ucontext
*ucontext
= to_iwch_ucontext(context
);
102 struct iwch_mm_entry
*mm
, *tmp
;
104 PDBG("%s context %p\n", __func__
, context
);
105 list_for_each_entry_safe(mm
, tmp
, &ucontext
->mmaps
, entry
)
107 cxio_release_ucontext(&rhp
->rdev
, &ucontext
->uctx
);
112 static struct ib_ucontext
*iwch_alloc_ucontext(struct ib_device
*ibdev
,
113 struct ib_udata
*udata
)
115 struct iwch_ucontext
*context
;
116 struct iwch_dev
*rhp
= to_iwch_dev(ibdev
);
118 PDBG("%s ibdev %p\n", __func__
, ibdev
);
119 context
= kzalloc(sizeof(*context
), GFP_KERNEL
);
121 return ERR_PTR(-ENOMEM
);
122 cxio_init_ucontext(&rhp
->rdev
, &context
->uctx
);
123 INIT_LIST_HEAD(&context
->mmaps
);
124 spin_lock_init(&context
->mmap_lock
);
125 return &context
->ibucontext
;
128 static int iwch_destroy_cq(struct ib_cq
*ib_cq
)
132 PDBG("%s ib_cq %p\n", __func__
, ib_cq
);
133 chp
= to_iwch_cq(ib_cq
);
135 remove_handle(chp
->rhp
, &chp
->rhp
->cqidr
, chp
->cq
.cqid
);
136 atomic_dec(&chp
->refcnt
);
137 wait_event(chp
->wait
, !atomic_read(&chp
->refcnt
));
139 cxio_destroy_cq(&chp
->rhp
->rdev
, &chp
->cq
);
144 static struct ib_cq
*iwch_create_cq(struct ib_device
*ibdev
, int entries
, int vector
,
145 struct ib_ucontext
*ib_context
,
146 struct ib_udata
*udata
)
148 struct iwch_dev
*rhp
;
150 struct iwch_create_cq_resp uresp
;
151 struct iwch_create_cq_req ureq
;
152 struct iwch_ucontext
*ucontext
= NULL
;
154 PDBG("%s ib_dev %p entries %d\n", __func__
, ibdev
, entries
);
155 rhp
= to_iwch_dev(ibdev
);
156 chp
= kzalloc(sizeof(*chp
), GFP_KERNEL
);
158 return ERR_PTR(-ENOMEM
);
161 ucontext
= to_iwch_ucontext(ib_context
);
162 if (!t3a_device(rhp
)) {
163 if (ib_copy_from_udata(&ureq
, udata
, sizeof (ureq
))) {
165 return ERR_PTR(-EFAULT
);
167 chp
->user_rptr_addr
= (u32 __user
*)(unsigned long)ureq
.user_rptr_addr
;
171 if (t3a_device(rhp
)) {
174 * T3A: Add some fluff to handle extra CQEs inserted
175 * for various errors.
176 * Additional CQE possibilities:
178 * incoming RDMA WRITE Failures
179 * incoming RDMA READ REQUEST FAILUREs
180 * NOTE: We cannot ensure the CQ won't overflow.
184 entries
= roundup_pow_of_two(entries
);
185 chp
->cq
.size_log2
= ilog2(entries
);
187 if (cxio_create_cq(&rhp
->rdev
, &chp
->cq
)) {
189 return ERR_PTR(-ENOMEM
);
192 chp
->ibcq
.cqe
= 1 << chp
->cq
.size_log2
;
193 spin_lock_init(&chp
->lock
);
194 atomic_set(&chp
->refcnt
, 1);
195 init_waitqueue_head(&chp
->wait
);
196 insert_handle(rhp
, &rhp
->cqidr
, chp
, chp
->cq
.cqid
);
199 struct iwch_mm_entry
*mm
;
201 mm
= kmalloc(sizeof *mm
, GFP_KERNEL
);
203 iwch_destroy_cq(&chp
->ibcq
);
204 return ERR_PTR(-ENOMEM
);
206 uresp
.cqid
= chp
->cq
.cqid
;
207 uresp
.size_log2
= chp
->cq
.size_log2
;
208 spin_lock(&ucontext
->mmap_lock
);
209 uresp
.key
= ucontext
->key
;
210 ucontext
->key
+= PAGE_SIZE
;
211 spin_unlock(&ucontext
->mmap_lock
);
212 if (ib_copy_to_udata(udata
, &uresp
, sizeof (uresp
))) {
214 iwch_destroy_cq(&chp
->ibcq
);
215 return ERR_PTR(-EFAULT
);
218 mm
->addr
= virt_to_phys(chp
->cq
.queue
);
219 mm
->len
= PAGE_ALIGN((1UL << uresp
.size_log2
) *
220 sizeof (struct t3_cqe
));
221 insert_mmap(ucontext
, mm
);
223 PDBG("created cqid 0x%0x chp %p size 0x%0x, dma_addr 0x%0llx\n",
224 chp
->cq
.cqid
, chp
, (1 << chp
->cq
.size_log2
),
225 (unsigned long long) chp
->cq
.dma_addr
);
229 static int iwch_resize_cq(struct ib_cq
*cq
, int cqe
, struct ib_udata
*udata
)
232 struct iwch_cq
*chp
= to_iwch_cq(cq
);
233 struct t3_cq oldcq
, newcq
;
236 PDBG("%s ib_cq %p cqe %d\n", __func__
, cq
, cqe
);
238 /* We don't downsize... */
242 /* create new t3_cq with new size */
243 cqe
= roundup_pow_of_two(cqe
+1);
244 newcq
.size_log2
= ilog2(cqe
);
246 /* Dont allow resize to less than the current wce count */
247 if (cqe
< Q_COUNT(chp
->cq
.rptr
, chp
->cq
.wptr
)) {
251 /* Quiesce all QPs using this CQ */
252 ret
= iwch_quiesce_qps(chp
);
257 ret
= cxio_create_cq(&chp
->rhp
->rdev
, &newcq
);
263 memcpy(newcq
.queue
, chp
->cq
.queue
, (1 << chp
->cq
.size_log2
) *
264 sizeof(struct t3_cqe
));
266 /* old iwch_qp gets new t3_cq but keeps old cqid */
269 chp
->cq
.cqid
= oldcq
.cqid
;
271 /* resize new t3_cq to update the HW context */
272 ret
= cxio_resize_cq(&chp
->rhp
->rdev
, &chp
->cq
);
277 chp
->ibcq
.cqe
= (1<<chp
->cq
.size_log2
) - 1;
279 /* destroy old t3_cq */
280 oldcq
.cqid
= newcq
.cqid
;
281 ret
= cxio_destroy_cq(&chp
->rhp
->rdev
, &oldcq
);
283 printk(KERN_ERR MOD
"%s - cxio_destroy_cq failed %d\n",
287 /* add user hooks here */
290 ret
= iwch_resume_qps(chp
);
297 static int iwch_arm_cq(struct ib_cq
*ibcq
, enum ib_cq_notify_flags flags
)
299 struct iwch_dev
*rhp
;
301 enum t3_cq_opcode cq_op
;
306 chp
= to_iwch_cq(ibcq
);
308 if ((flags
& IB_CQ_SOLICITED_MASK
) == IB_CQ_SOLICITED
)
312 if (chp
->user_rptr_addr
) {
313 if (get_user(rptr
, chp
->user_rptr_addr
))
315 spin_lock_irqsave(&chp
->lock
, flag
);
318 spin_lock_irqsave(&chp
->lock
, flag
);
319 PDBG("%s rptr 0x%x\n", __func__
, chp
->cq
.rptr
);
320 err
= cxio_hal_cq_op(&rhp
->rdev
, &chp
->cq
, cq_op
, 0);
321 spin_unlock_irqrestore(&chp
->lock
, flag
);
323 printk(KERN_ERR MOD
"Error %d rearming CQID 0x%x\n", err
,
325 if (err
> 0 && !(flags
& IB_CQ_REPORT_MISSED_EVENTS
))
330 static int iwch_mmap(struct ib_ucontext
*context
, struct vm_area_struct
*vma
)
332 int len
= vma
->vm_end
- vma
->vm_start
;
333 u32 key
= vma
->vm_pgoff
<< PAGE_SHIFT
;
334 struct cxio_rdev
*rdev_p
;
336 struct iwch_mm_entry
*mm
;
337 struct iwch_ucontext
*ucontext
;
340 PDBG("%s pgoff 0x%lx key 0x%x len %d\n", __func__
, vma
->vm_pgoff
,
343 if (vma
->vm_start
& (PAGE_SIZE
-1)) {
347 rdev_p
= &(to_iwch_dev(context
->device
)->rdev
);
348 ucontext
= to_iwch_ucontext(context
);
350 mm
= remove_mmap(ucontext
, key
, len
);
356 if ((addr
>= rdev_p
->rnic_info
.udbell_physbase
) &&
357 (addr
< (rdev_p
->rnic_info
.udbell_physbase
+
358 rdev_p
->rnic_info
.udbell_len
))) {
361 * Map T3 DB register.
363 if (vma
->vm_flags
& VM_READ
) {
367 vma
->vm_page_prot
= pgprot_noncached(vma
->vm_page_prot
);
368 vma
->vm_flags
|= VM_DONTCOPY
| VM_DONTEXPAND
;
369 vma
->vm_flags
&= ~VM_MAYREAD
;
370 ret
= io_remap_pfn_range(vma
, vma
->vm_start
,
372 len
, vma
->vm_page_prot
);
376 * Map WQ or CQ contig dma memory...
378 ret
= remap_pfn_range(vma
, vma
->vm_start
,
380 len
, vma
->vm_page_prot
);
386 static int iwch_deallocate_pd(struct ib_pd
*pd
)
388 struct iwch_dev
*rhp
;
391 php
= to_iwch_pd(pd
);
393 PDBG("%s ibpd %p pdid 0x%x\n", __func__
, pd
, php
->pdid
);
394 cxio_hal_put_pdid(rhp
->rdev
.rscp
, php
->pdid
);
399 static struct ib_pd
*iwch_allocate_pd(struct ib_device
*ibdev
,
400 struct ib_ucontext
*context
,
401 struct ib_udata
*udata
)
405 struct iwch_dev
*rhp
;
407 PDBG("%s ibdev %p\n", __func__
, ibdev
);
408 rhp
= (struct iwch_dev
*) ibdev
;
409 pdid
= cxio_hal_get_pdid(rhp
->rdev
.rscp
);
411 return ERR_PTR(-EINVAL
);
412 php
= kzalloc(sizeof(*php
), GFP_KERNEL
);
414 cxio_hal_put_pdid(rhp
->rdev
.rscp
, pdid
);
415 return ERR_PTR(-ENOMEM
);
420 if (ib_copy_to_udata(udata
, &php
->pdid
, sizeof (__u32
))) {
421 iwch_deallocate_pd(&php
->ibpd
);
422 return ERR_PTR(-EFAULT
);
425 PDBG("%s pdid 0x%0x ptr 0x%p\n", __func__
, pdid
, php
);
429 static int iwch_dereg_mr(struct ib_mr
*ib_mr
)
431 struct iwch_dev
*rhp
;
435 PDBG("%s ib_mr %p\n", __func__
, ib_mr
);
436 /* There can be no memory windows */
437 if (atomic_read(&ib_mr
->usecnt
))
440 mhp
= to_iwch_mr(ib_mr
);
442 mmid
= mhp
->attr
.stag
>> 8;
443 cxio_dereg_mem(&rhp
->rdev
, mhp
->attr
.stag
, mhp
->attr
.pbl_size
,
446 remove_handle(rhp
, &rhp
->mmidr
, mmid
);
448 kfree((void *) (unsigned long) mhp
->kva
);
450 ib_umem_release(mhp
->umem
);
451 PDBG("%s mmid 0x%x ptr %p\n", __func__
, mmid
, mhp
);
456 static struct ib_mr
*iwch_register_phys_mem(struct ib_pd
*pd
,
457 struct ib_phys_buf
*buffer_list
,
466 struct iwch_dev
*rhp
;
471 PDBG("%s ib_pd %p\n", __func__
, pd
);
472 php
= to_iwch_pd(pd
);
475 mhp
= kzalloc(sizeof(*mhp
), GFP_KERNEL
);
477 return ERR_PTR(-ENOMEM
);
481 /* First check that we have enough alignment */
482 if ((*iova_start
& ~PAGE_MASK
) != (buffer_list
[0].addr
& ~PAGE_MASK
)) {
487 if (num_phys_buf
> 1 &&
488 ((buffer_list
[0].addr
+ buffer_list
[0].size
) & ~PAGE_MASK
)) {
493 ret
= build_phys_page_list(buffer_list
, num_phys_buf
, iova_start
,
494 &total_size
, &npages
, &shift
, &page_list
);
498 ret
= iwch_alloc_pbl(mhp
, npages
);
504 ret
= iwch_write_pbl(mhp
, page_list
, npages
, 0);
509 mhp
->attr
.pdid
= php
->pdid
;
512 mhp
->attr
.perms
= iwch_ib_to_tpt_access(acc
);
513 mhp
->attr
.va_fbo
= *iova_start
;
514 mhp
->attr
.page_size
= shift
- 12;
516 mhp
->attr
.len
= (u32
) total_size
;
517 mhp
->attr
.pbl_size
= npages
;
518 ret
= iwch_register_mem(rhp
, php
, mhp
, shift
);
533 static int iwch_reregister_phys_mem(struct ib_mr
*mr
,
536 struct ib_phys_buf
*buffer_list
,
538 int acc
, u64
* iova_start
)
541 struct iwch_mr mh
, *mhp
;
543 struct iwch_dev
*rhp
;
544 __be64
*page_list
= NULL
;
550 PDBG("%s ib_mr %p ib_pd %p\n", __func__
, mr
, pd
);
552 /* There can be no memory windows */
553 if (atomic_read(&mr
->usecnt
))
556 mhp
= to_iwch_mr(mr
);
558 php
= to_iwch_pd(mr
->pd
);
560 /* make sure we are on the same adapter */
564 memcpy(&mh
, mhp
, sizeof *mhp
);
566 if (mr_rereg_mask
& IB_MR_REREG_PD
)
567 php
= to_iwch_pd(pd
);
568 if (mr_rereg_mask
& IB_MR_REREG_ACCESS
)
569 mh
.attr
.perms
= iwch_ib_to_tpt_access(acc
);
570 if (mr_rereg_mask
& IB_MR_REREG_TRANS
) {
571 ret
= build_phys_page_list(buffer_list
, num_phys_buf
,
573 &total_size
, &npages
,
579 ret
= iwch_reregister_mem(rhp
, php
, &mh
, shift
, npages
);
584 if (mr_rereg_mask
& IB_MR_REREG_PD
)
585 mhp
->attr
.pdid
= php
->pdid
;
586 if (mr_rereg_mask
& IB_MR_REREG_ACCESS
)
587 mhp
->attr
.perms
= iwch_ib_to_tpt_access(acc
);
588 if (mr_rereg_mask
& IB_MR_REREG_TRANS
) {
590 mhp
->attr
.va_fbo
= *iova_start
;
591 mhp
->attr
.page_size
= shift
- 12;
592 mhp
->attr
.len
= (u32
) total_size
;
593 mhp
->attr
.pbl_size
= npages
;
600 static struct ib_mr
*iwch_reg_user_mr(struct ib_pd
*pd
, u64 start
, u64 length
,
601 u64 virt
, int acc
, struct ib_udata
*udata
)
607 struct ib_umem_chunk
*chunk
;
608 struct iwch_dev
*rhp
;
611 struct iwch_reg_user_mr_resp uresp
;
613 PDBG("%s ib_pd %p\n", __func__
, pd
);
615 php
= to_iwch_pd(pd
);
617 mhp
= kzalloc(sizeof(*mhp
), GFP_KERNEL
);
619 return ERR_PTR(-ENOMEM
);
623 mhp
->umem
= ib_umem_get(pd
->uobject
->context
, start
, length
, acc
, 0);
624 if (IS_ERR(mhp
->umem
)) {
625 err
= PTR_ERR(mhp
->umem
);
630 shift
= ffs(mhp
->umem
->page_size
) - 1;
633 list_for_each_entry(chunk
, &mhp
->umem
->chunk_list
, list
)
636 err
= iwch_alloc_pbl(mhp
, n
);
640 pages
= (__be64
*) __get_free_page(GFP_KERNEL
);
648 list_for_each_entry(chunk
, &mhp
->umem
->chunk_list
, list
)
649 for (j
= 0; j
< chunk
->nmap
; ++j
) {
650 len
= sg_dma_len(&chunk
->page_list
[j
]) >> shift
;
651 for (k
= 0; k
< len
; ++k
) {
652 pages
[i
++] = cpu_to_be64(sg_dma_address(
653 &chunk
->page_list
[j
]) +
654 mhp
->umem
->page_size
* k
);
655 if (i
== PAGE_SIZE
/ sizeof *pages
) {
656 err
= iwch_write_pbl(mhp
, pages
, i
, n
);
666 err
= iwch_write_pbl(mhp
, pages
, i
, n
);
669 free_page((unsigned long) pages
);
673 mhp
->attr
.pdid
= php
->pdid
;
675 mhp
->attr
.perms
= iwch_ib_to_tpt_access(acc
);
676 mhp
->attr
.va_fbo
= virt
;
677 mhp
->attr
.page_size
= shift
- 12;
678 mhp
->attr
.len
= (u32
) length
;
680 err
= iwch_register_mem(rhp
, php
, mhp
, shift
);
684 if (udata
&& !t3a_device(rhp
)) {
685 uresp
.pbl_addr
= (mhp
->attr
.pbl_addr
-
686 rhp
->rdev
.rnic_info
.pbl_base
) >> 3;
687 PDBG("%s user resp pbl_addr 0x%x\n", __func__
,
690 if (ib_copy_to_udata(udata
, &uresp
, sizeof (uresp
))) {
691 iwch_dereg_mr(&mhp
->ibmr
);
703 ib_umem_release(mhp
->umem
);
708 static struct ib_mr
*iwch_get_dma_mr(struct ib_pd
*pd
, int acc
)
710 struct ib_phys_buf bl
;
714 PDBG("%s ib_pd %p\n", __func__
, pd
);
717 * T3 only supports 32 bits of size.
719 bl
.size
= 0xffffffff;
722 ibmr
= iwch_register_phys_mem(pd
, &bl
, 1, acc
, &kva
);
726 static struct ib_mw
*iwch_alloc_mw(struct ib_pd
*pd
)
728 struct iwch_dev
*rhp
;
735 php
= to_iwch_pd(pd
);
737 mhp
= kzalloc(sizeof(*mhp
), GFP_KERNEL
);
739 return ERR_PTR(-ENOMEM
);
740 ret
= cxio_allocate_window(&rhp
->rdev
, &stag
, php
->pdid
);
746 mhp
->attr
.pdid
= php
->pdid
;
747 mhp
->attr
.type
= TPT_MW
;
748 mhp
->attr
.stag
= stag
;
750 insert_handle(rhp
, &rhp
->mmidr
, mhp
, mmid
);
751 PDBG("%s mmid 0x%x mhp %p stag 0x%x\n", __func__
, mmid
, mhp
, stag
);
755 static int iwch_dealloc_mw(struct ib_mw
*mw
)
757 struct iwch_dev
*rhp
;
761 mhp
= to_iwch_mw(mw
);
763 mmid
= (mw
->rkey
) >> 8;
764 cxio_deallocate_window(&rhp
->rdev
, mhp
->attr
.stag
);
765 remove_handle(rhp
, &rhp
->mmidr
, mmid
);
767 PDBG("%s ib_mw %p mmid 0x%x ptr %p\n", __func__
, mw
, mmid
, mhp
);
771 static int iwch_destroy_qp(struct ib_qp
*ib_qp
)
773 struct iwch_dev
*rhp
;
775 struct iwch_qp_attributes attrs
;
776 struct iwch_ucontext
*ucontext
;
778 qhp
= to_iwch_qp(ib_qp
);
781 attrs
.next_state
= IWCH_QP_STATE_ERROR
;
782 iwch_modify_qp(rhp
, qhp
, IWCH_QP_ATTR_NEXT_STATE
, &attrs
, 0);
783 wait_event(qhp
->wait
, !qhp
->ep
);
785 remove_handle(rhp
, &rhp
->qpidr
, qhp
->wq
.qpid
);
787 atomic_dec(&qhp
->refcnt
);
788 wait_event(qhp
->wait
, !atomic_read(&qhp
->refcnt
));
790 ucontext
= ib_qp
->uobject
? to_iwch_ucontext(ib_qp
->uobject
->context
)
792 cxio_destroy_qp(&rhp
->rdev
, &qhp
->wq
,
793 ucontext
? &ucontext
->uctx
: &rhp
->rdev
.uctx
);
795 PDBG("%s ib_qp %p qpid 0x%0x qhp %p\n", __func__
,
796 ib_qp
, qhp
->wq
.qpid
, qhp
);
801 static struct ib_qp
*iwch_create_qp(struct ib_pd
*pd
,
802 struct ib_qp_init_attr
*attrs
,
803 struct ib_udata
*udata
)
805 struct iwch_dev
*rhp
;
808 struct iwch_cq
*schp
;
809 struct iwch_cq
*rchp
;
810 struct iwch_create_qp_resp uresp
;
811 int wqsize
, sqsize
, rqsize
;
812 struct iwch_ucontext
*ucontext
;
814 PDBG("%s ib_pd %p\n", __func__
, pd
);
815 if (attrs
->qp_type
!= IB_QPT_RC
)
816 return ERR_PTR(-EINVAL
);
817 php
= to_iwch_pd(pd
);
819 schp
= get_chp(rhp
, ((struct iwch_cq
*) attrs
->send_cq
)->cq
.cqid
);
820 rchp
= get_chp(rhp
, ((struct iwch_cq
*) attrs
->recv_cq
)->cq
.cqid
);
822 return ERR_PTR(-EINVAL
);
824 /* The RQT size must be # of entries + 1 rounded up to a power of two */
825 rqsize
= roundup_pow_of_two(attrs
->cap
.max_recv_wr
);
826 if (rqsize
== attrs
->cap
.max_recv_wr
)
827 rqsize
= roundup_pow_of_two(attrs
->cap
.max_recv_wr
+1);
829 /* T3 doesn't support RQT depth < 16 */
833 if (rqsize
> T3_MAX_RQ_SIZE
)
834 return ERR_PTR(-EINVAL
);
836 if (attrs
->cap
.max_inline_data
> T3_MAX_INLINE
)
837 return ERR_PTR(-EINVAL
);
840 * NOTE: The SQ and total WQ sizes don't need to be
841 * a power of two. However, all the code assumes
842 * they are. EG: Q_FREECNT() and friends.
844 sqsize
= roundup_pow_of_two(attrs
->cap
.max_send_wr
);
845 wqsize
= roundup_pow_of_two(rqsize
+ sqsize
);
846 PDBG("%s wqsize %d sqsize %d rqsize %d\n", __func__
,
847 wqsize
, sqsize
, rqsize
);
848 qhp
= kzalloc(sizeof(*qhp
), GFP_KERNEL
);
850 return ERR_PTR(-ENOMEM
);
851 qhp
->wq
.size_log2
= ilog2(wqsize
);
852 qhp
->wq
.rq_size_log2
= ilog2(rqsize
);
853 qhp
->wq
.sq_size_log2
= ilog2(sqsize
);
854 ucontext
= pd
->uobject
? to_iwch_ucontext(pd
->uobject
->context
) : NULL
;
855 if (cxio_create_qp(&rhp
->rdev
, !udata
, &qhp
->wq
,
856 ucontext
? &ucontext
->uctx
: &rhp
->rdev
.uctx
)) {
858 return ERR_PTR(-ENOMEM
);
861 attrs
->cap
.max_recv_wr
= rqsize
- 1;
862 attrs
->cap
.max_send_wr
= sqsize
;
863 attrs
->cap
.max_inline_data
= T3_MAX_INLINE
;
866 qhp
->attr
.pd
= php
->pdid
;
867 qhp
->attr
.scq
= ((struct iwch_cq
*) attrs
->send_cq
)->cq
.cqid
;
868 qhp
->attr
.rcq
= ((struct iwch_cq
*) attrs
->recv_cq
)->cq
.cqid
;
869 qhp
->attr
.sq_num_entries
= attrs
->cap
.max_send_wr
;
870 qhp
->attr
.rq_num_entries
= attrs
->cap
.max_recv_wr
;
871 qhp
->attr
.sq_max_sges
= attrs
->cap
.max_send_sge
;
872 qhp
->attr
.sq_max_sges_rdma_write
= attrs
->cap
.max_send_sge
;
873 qhp
->attr
.rq_max_sges
= attrs
->cap
.max_recv_sge
;
874 qhp
->attr
.state
= IWCH_QP_STATE_IDLE
;
875 qhp
->attr
.next_state
= IWCH_QP_STATE_IDLE
;
878 * XXX - These don't get passed in from the openib user
879 * at create time. The CM sets them via a QP modify.
880 * Need to fix... I think the CM should
882 qhp
->attr
.enable_rdma_read
= 1;
883 qhp
->attr
.enable_rdma_write
= 1;
884 qhp
->attr
.enable_bind
= 1;
885 qhp
->attr
.max_ord
= 1;
886 qhp
->attr
.max_ird
= 1;
888 spin_lock_init(&qhp
->lock
);
889 init_waitqueue_head(&qhp
->wait
);
890 atomic_set(&qhp
->refcnt
, 1);
891 insert_handle(rhp
, &rhp
->qpidr
, qhp
, qhp
->wq
.qpid
);
895 struct iwch_mm_entry
*mm1
, *mm2
;
897 mm1
= kmalloc(sizeof *mm1
, GFP_KERNEL
);
899 iwch_destroy_qp(&qhp
->ibqp
);
900 return ERR_PTR(-ENOMEM
);
903 mm2
= kmalloc(sizeof *mm2
, GFP_KERNEL
);
906 iwch_destroy_qp(&qhp
->ibqp
);
907 return ERR_PTR(-ENOMEM
);
910 uresp
.qpid
= qhp
->wq
.qpid
;
911 uresp
.size_log2
= qhp
->wq
.size_log2
;
912 uresp
.sq_size_log2
= qhp
->wq
.sq_size_log2
;
913 uresp
.rq_size_log2
= qhp
->wq
.rq_size_log2
;
914 spin_lock(&ucontext
->mmap_lock
);
915 uresp
.key
= ucontext
->key
;
916 ucontext
->key
+= PAGE_SIZE
;
917 uresp
.db_key
= ucontext
->key
;
918 ucontext
->key
+= PAGE_SIZE
;
919 spin_unlock(&ucontext
->mmap_lock
);
920 if (ib_copy_to_udata(udata
, &uresp
, sizeof (uresp
))) {
923 iwch_destroy_qp(&qhp
->ibqp
);
924 return ERR_PTR(-EFAULT
);
926 mm1
->key
= uresp
.key
;
927 mm1
->addr
= virt_to_phys(qhp
->wq
.queue
);
928 mm1
->len
= PAGE_ALIGN(wqsize
* sizeof (union t3_wr
));
929 insert_mmap(ucontext
, mm1
);
930 mm2
->key
= uresp
.db_key
;
931 mm2
->addr
= qhp
->wq
.udb
& PAGE_MASK
;
932 mm2
->len
= PAGE_SIZE
;
933 insert_mmap(ucontext
, mm2
);
935 qhp
->ibqp
.qp_num
= qhp
->wq
.qpid
;
936 init_timer(&(qhp
->timer
));
937 PDBG("%s sq_num_entries %d, rq_num_entries %d "
938 "qpid 0x%0x qhp %p dma_addr 0x%llx size %d\n",
939 __func__
, qhp
->attr
.sq_num_entries
, qhp
->attr
.rq_num_entries
,
940 qhp
->wq
.qpid
, qhp
, (unsigned long long) qhp
->wq
.dma_addr
,
941 1 << qhp
->wq
.size_log2
);
945 static int iwch_ib_modify_qp(struct ib_qp
*ibqp
, struct ib_qp_attr
*attr
,
946 int attr_mask
, struct ib_udata
*udata
)
948 struct iwch_dev
*rhp
;
950 enum iwch_qp_attr_mask mask
= 0;
951 struct iwch_qp_attributes attrs
;
953 PDBG("%s ib_qp %p\n", __func__
, ibqp
);
955 /* iwarp does not support the RTR state */
956 if ((attr_mask
& IB_QP_STATE
) && (attr
->qp_state
== IB_QPS_RTR
))
957 attr_mask
&= ~IB_QP_STATE
;
959 /* Make sure we still have something left to do */
963 memset(&attrs
, 0, sizeof attrs
);
964 qhp
= to_iwch_qp(ibqp
);
967 attrs
.next_state
= iwch_convert_state(attr
->qp_state
);
968 attrs
.enable_rdma_read
= (attr
->qp_access_flags
&
969 IB_ACCESS_REMOTE_READ
) ? 1 : 0;
970 attrs
.enable_rdma_write
= (attr
->qp_access_flags
&
971 IB_ACCESS_REMOTE_WRITE
) ? 1 : 0;
972 attrs
.enable_bind
= (attr
->qp_access_flags
& IB_ACCESS_MW_BIND
) ? 1 : 0;
975 mask
|= (attr_mask
& IB_QP_STATE
) ? IWCH_QP_ATTR_NEXT_STATE
: 0;
976 mask
|= (attr_mask
& IB_QP_ACCESS_FLAGS
) ?
977 (IWCH_QP_ATTR_ENABLE_RDMA_READ
|
978 IWCH_QP_ATTR_ENABLE_RDMA_WRITE
|
979 IWCH_QP_ATTR_ENABLE_RDMA_BIND
) : 0;
981 return iwch_modify_qp(rhp
, qhp
, mask
, &attrs
, 0);
984 void iwch_qp_add_ref(struct ib_qp
*qp
)
986 PDBG("%s ib_qp %p\n", __func__
, qp
);
987 atomic_inc(&(to_iwch_qp(qp
)->refcnt
));
990 void iwch_qp_rem_ref(struct ib_qp
*qp
)
992 PDBG("%s ib_qp %p\n", __func__
, qp
);
993 if (atomic_dec_and_test(&(to_iwch_qp(qp
)->refcnt
)))
994 wake_up(&(to_iwch_qp(qp
)->wait
));
/*
 * Look up a QP on @dev by its QP number.
 *
 * The result of get_qhp() is returned as-is, merely cast to
 * struct ib_qp *; no reference is taken here.
 * NOTE(review): the cast presumably relies on the ib_qp being the first
 * member of struct iwch_qp -- confirm against iwch_provider.h.
 */
static struct ib_qp *iwch_get_qp(struct ib_device *dev, int qpn)
{
	struct iwch_dev *rhp;

	PDBG("%s ib_dev %p qpn 0x%x\n", __func__, dev, qpn);

	rhp = to_iwch_dev(dev);
	return (struct ib_qp *)get_qhp(rhp, qpn);
}
1004 static int iwch_query_pkey(struct ib_device
*ibdev
,
1005 u8 port
, u16 index
, u16
* pkey
)
1007 PDBG("%s ibdev %p\n", __func__
, ibdev
);
1012 static int iwch_query_gid(struct ib_device
*ibdev
, u8 port
,
1013 int index
, union ib_gid
*gid
)
1015 struct iwch_dev
*dev
;
1017 PDBG("%s ibdev %p, port %d, index %d, gid %p\n",
1018 __func__
, ibdev
, port
, index
, gid
);
1019 dev
= to_iwch_dev(ibdev
);
1020 BUG_ON(port
== 0 || port
> 2);
1021 memset(&(gid
->raw
[0]), 0, sizeof(gid
->raw
));
1022 memcpy(&(gid
->raw
[0]), dev
->rdev
.port_info
.lldevs
[port
-1]->dev_addr
, 6);
1026 static int iwch_query_device(struct ib_device
*ibdev
,
1027 struct ib_device_attr
*props
)
1030 struct iwch_dev
*dev
;
1031 PDBG("%s ibdev %p\n", __func__
, ibdev
);
1033 dev
= to_iwch_dev(ibdev
);
1034 memset(props
, 0, sizeof *props
);
1035 memcpy(&props
->sys_image_guid
, dev
->rdev
.t3cdev_p
->lldev
->dev_addr
, 6);
1036 props
->device_cap_flags
= dev
->device_cap_flags
;
1037 props
->vendor_id
= (u32
)dev
->rdev
.rnic_info
.pdev
->vendor
;
1038 props
->vendor_part_id
= (u32
)dev
->rdev
.rnic_info
.pdev
->device
;
1039 props
->max_mr_size
= dev
->attr
.max_mr_size
;
1040 props
->max_qp
= dev
->attr
.max_qps
;
1041 props
->max_qp_wr
= dev
->attr
.max_wrs
;
1042 props
->max_sge
= dev
->attr
.max_sge_per_wr
;
1043 props
->max_sge_rd
= 1;
1044 props
->max_qp_rd_atom
= dev
->attr
.max_rdma_reads_per_qp
;
1045 props
->max_qp_init_rd_atom
= dev
->attr
.max_rdma_reads_per_qp
;
1046 props
->max_cq
= dev
->attr
.max_cqs
;
1047 props
->max_cqe
= dev
->attr
.max_cqes_per_cq
;
1048 props
->max_mr
= dev
->attr
.max_mem_regs
;
1049 props
->max_pd
= dev
->attr
.max_pds
;
1050 props
->local_ca_ack_delay
= 0;
1055 static int iwch_query_port(struct ib_device
*ibdev
,
1056 u8 port
, struct ib_port_attr
*props
)
1058 PDBG("%s ibdev %p\n", __func__
, ibdev
);
1059 props
->max_mtu
= IB_MTU_4096
;
1064 props
->state
= IB_PORT_ACTIVE
;
1065 props
->phys_state
= 0;
1066 props
->port_cap_flags
=
1068 IB_PORT_SNMP_TUNNEL_SUP
|
1069 IB_PORT_REINIT_SUP
|
1070 IB_PORT_DEVICE_MGMT_SUP
|
1071 IB_PORT_VENDOR_CLASS_SUP
| IB_PORT_BOOT_MGMT_SUP
;
1072 props
->gid_tbl_len
= 1;
1073 props
->pkey_tbl_len
= 1;
1074 props
->qkey_viol_cntr
= 0;
1075 props
->active_width
= 2;
1076 props
->active_speed
= 2;
1077 props
->max_msg_sz
= -1;
1082 static ssize_t
show_rev(struct device
*dev
, struct device_attribute
*attr
,
1085 struct iwch_dev
*iwch_dev
= container_of(dev
, struct iwch_dev
,
1087 PDBG("%s dev 0x%p\n", __func__
, dev
);
1088 return sprintf(buf
, "%d\n", iwch_dev
->rdev
.t3cdev_p
->type
);
1091 static ssize_t
show_fw_ver(struct device
*dev
, struct device_attribute
*attr
, char *buf
)
1093 struct iwch_dev
*iwch_dev
= container_of(dev
, struct iwch_dev
,
1095 struct ethtool_drvinfo info
;
1096 struct net_device
*lldev
= iwch_dev
->rdev
.t3cdev_p
->lldev
;
1098 PDBG("%s dev 0x%p\n", __func__
, dev
);
1099 lldev
->ethtool_ops
->get_drvinfo(lldev
, &info
);
1100 return sprintf(buf
, "%s\n", info
.fw_version
);
1103 static ssize_t
show_hca(struct device
*dev
, struct device_attribute
*attr
,
1106 struct iwch_dev
*iwch_dev
= container_of(dev
, struct iwch_dev
,
1108 struct ethtool_drvinfo info
;
1109 struct net_device
*lldev
= iwch_dev
->rdev
.t3cdev_p
->lldev
;
1111 PDBG("%s dev 0x%p\n", __func__
, dev
);
1112 lldev
->ethtool_ops
->get_drvinfo(lldev
, &info
);
1113 return sprintf(buf
, "%s\n", info
.driver
);
1116 static ssize_t
show_board(struct device
*dev
, struct device_attribute
*attr
,
1119 struct iwch_dev
*iwch_dev
= container_of(dev
, struct iwch_dev
,
1121 PDBG("%s dev 0x%p\n", __func__
, dev
);
1122 return sprintf(buf
, "%x.%x\n", iwch_dev
->rdev
.rnic_info
.pdev
->vendor
,
1123 iwch_dev
->rdev
.rnic_info
.pdev
->device
);
/*
 * Read-only (S_IRUGO) device attributes; none of them has a store
 * handler.
 */
static DEVICE_ATTR(hw_rev,   S_IRUGO, show_rev,    NULL);	/* adapter type   */
static DEVICE_ATTR(fw_ver,   S_IRUGO, show_fw_ver, NULL);	/* firmware ver.  */
static DEVICE_ATTR(hca_type, S_IRUGO, show_hca,    NULL);	/* driver name    */
static DEVICE_ATTR(board_id, S_IRUGO, show_board,  NULL);	/* PCI vendor.dev */
1131 static struct device_attribute
*iwch_class_attributes
[] = {
1138 int iwch_register_device(struct iwch_dev
*dev
)
1143 PDBG("%s iwch_dev %p\n", __func__
, dev
);
1144 strlcpy(dev
->ibdev
.name
, "cxgb3_%d", IB_DEVICE_NAME_MAX
);
1145 memset(&dev
->ibdev
.node_guid
, 0, sizeof(dev
->ibdev
.node_guid
));
1146 memcpy(&dev
->ibdev
.node_guid
, dev
->rdev
.t3cdev_p
->lldev
->dev_addr
, 6);
1147 dev
->ibdev
.owner
= THIS_MODULE
;
1148 dev
->device_cap_flags
=
1149 (IB_DEVICE_ZERO_STAG
| IB_DEVICE_MEM_WINDOW
);
1151 dev
->ibdev
.uverbs_cmd_mask
=
1152 (1ull << IB_USER_VERBS_CMD_GET_CONTEXT
) |
1153 (1ull << IB_USER_VERBS_CMD_QUERY_DEVICE
) |
1154 (1ull << IB_USER_VERBS_CMD_QUERY_PORT
) |
1155 (1ull << IB_USER_VERBS_CMD_ALLOC_PD
) |
1156 (1ull << IB_USER_VERBS_CMD_DEALLOC_PD
) |
1157 (1ull << IB_USER_VERBS_CMD_REG_MR
) |
1158 (1ull << IB_USER_VERBS_CMD_DEREG_MR
) |
1159 (1ull << IB_USER_VERBS_CMD_CREATE_COMP_CHANNEL
) |
1160 (1ull << IB_USER_VERBS_CMD_CREATE_CQ
) |
1161 (1ull << IB_USER_VERBS_CMD_DESTROY_CQ
) |
1162 (1ull << IB_USER_VERBS_CMD_REQ_NOTIFY_CQ
) |
1163 (1ull << IB_USER_VERBS_CMD_CREATE_QP
) |
1164 (1ull << IB_USER_VERBS_CMD_MODIFY_QP
) |
1165 (1ull << IB_USER_VERBS_CMD_POLL_CQ
) |
1166 (1ull << IB_USER_VERBS_CMD_DESTROY_QP
) |
1167 (1ull << IB_USER_VERBS_CMD_POST_SEND
) |
1168 (1ull << IB_USER_VERBS_CMD_POST_RECV
);
1169 dev
->ibdev
.node_type
= RDMA_NODE_RNIC
;
1170 memcpy(dev
->ibdev
.node_desc
, IWCH_NODE_DESC
, sizeof(IWCH_NODE_DESC
));
1171 dev
->ibdev
.phys_port_cnt
= dev
->rdev
.port_info
.nports
;
1172 dev
->ibdev
.num_comp_vectors
= 1;
1173 dev
->ibdev
.dma_device
= &(dev
->rdev
.rnic_info
.pdev
->dev
);
1174 dev
->ibdev
.query_device
= iwch_query_device
;
1175 dev
->ibdev
.query_port
= iwch_query_port
;
1176 dev
->ibdev
.modify_port
= iwch_modify_port
;
1177 dev
->ibdev
.query_pkey
= iwch_query_pkey
;
1178 dev
->ibdev
.query_gid
= iwch_query_gid
;
1179 dev
->ibdev
.alloc_ucontext
= iwch_alloc_ucontext
;
1180 dev
->ibdev
.dealloc_ucontext
= iwch_dealloc_ucontext
;
1181 dev
->ibdev
.mmap
= iwch_mmap
;
1182 dev
->ibdev
.alloc_pd
= iwch_allocate_pd
;
1183 dev
->ibdev
.dealloc_pd
= iwch_deallocate_pd
;
1184 dev
->ibdev
.create_ah
= iwch_ah_create
;
1185 dev
->ibdev
.destroy_ah
= iwch_ah_destroy
;
1186 dev
->ibdev
.create_qp
= iwch_create_qp
;
1187 dev
->ibdev
.modify_qp
= iwch_ib_modify_qp
;
1188 dev
->ibdev
.destroy_qp
= iwch_destroy_qp
;
1189 dev
->ibdev
.create_cq
= iwch_create_cq
;
1190 dev
->ibdev
.destroy_cq
= iwch_destroy_cq
;
1191 dev
->ibdev
.resize_cq
= iwch_resize_cq
;
1192 dev
->ibdev
.poll_cq
= iwch_poll_cq
;
1193 dev
->ibdev
.get_dma_mr
= iwch_get_dma_mr
;
1194 dev
->ibdev
.reg_phys_mr
= iwch_register_phys_mem
;
1195 dev
->ibdev
.rereg_phys_mr
= iwch_reregister_phys_mem
;
1196 dev
->ibdev
.reg_user_mr
= iwch_reg_user_mr
;
1197 dev
->ibdev
.dereg_mr
= iwch_dereg_mr
;
1198 dev
->ibdev
.alloc_mw
= iwch_alloc_mw
;
1199 dev
->ibdev
.bind_mw
= iwch_bind_mw
;
1200 dev
->ibdev
.dealloc_mw
= iwch_dealloc_mw
;
1202 dev
->ibdev
.attach_mcast
= iwch_multicast_attach
;
1203 dev
->ibdev
.detach_mcast
= iwch_multicast_detach
;
1204 dev
->ibdev
.process_mad
= iwch_process_mad
;
1206 dev
->ibdev
.req_notify_cq
= iwch_arm_cq
;
1207 dev
->ibdev
.post_send
= iwch_post_send
;
1208 dev
->ibdev
.post_recv
= iwch_post_receive
;
1211 dev
->ibdev
.iwcm
= kmalloc(sizeof(struct iw_cm_verbs
), GFP_KERNEL
);
1212 if (!dev
->ibdev
.iwcm
)
1215 dev
->ibdev
.iwcm
->connect
= iwch_connect
;
1216 dev
->ibdev
.iwcm
->accept
= iwch_accept_cr
;
1217 dev
->ibdev
.iwcm
->reject
= iwch_reject_cr
;
1218 dev
->ibdev
.iwcm
->create_listen
= iwch_create_listen
;
1219 dev
->ibdev
.iwcm
->destroy_listen
= iwch_destroy_listen
;
1220 dev
->ibdev
.iwcm
->add_ref
= iwch_qp_add_ref
;
1221 dev
->ibdev
.iwcm
->rem_ref
= iwch_qp_rem_ref
;
1222 dev
->ibdev
.iwcm
->get_qp
= iwch_get_qp
;
1224 ret
= ib_register_device(&dev
->ibdev
);
1228 for (i
= 0; i
< ARRAY_SIZE(iwch_class_attributes
); ++i
) {
1229 ret
= device_create_file(&dev
->ibdev
.dev
,
1230 iwch_class_attributes
[i
]);
1237 ib_unregister_device(&dev
->ibdev
);
1242 void iwch_unregister_device(struct iwch_dev
*dev
)
1246 PDBG("%s iwch_dev %p\n", __func__
, dev
);
1247 for (i
= 0; i
< ARRAY_SIZE(iwch_class_attributes
); ++i
)
1248 device_remove_file(&dev
->ibdev
.dev
,
1249 iwch_class_attributes
[i
]);
1250 ib_unregister_device(&dev
->ibdev
);