1 /* This file is part of the Emulex RoCE Device Driver for
2 * RoCE (RDMA over Converged Ethernet) adapters.
3 * Copyright (C) 2012-2015 Emulex. All rights reserved.
4 * EMULEX and SLI are trademarks of Emulex.
7 * This software is available to you under a choice of one of two licenses.
8 * You may choose to be licensed under the terms of the GNU General Public
9 * License (GPL) Version 2, available from the file COPYING in the main
10 * directory of this source tree, or the BSD license below:
12 * Redistribution and use in source and binary forms, with or without
13 * modification, are permitted provided that the following conditions
16 * - Redistributions of source code must retain the above copyright notice,
17 * this list of conditions and the following disclaimer.
19 * - Redistributions in binary form must reproduce the above copyright
20 * notice, this list of conditions and the following disclaimer in
21 * the documentation and/or other materials provided with the distribution.
23 * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
24 * AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO,THE
25 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
26 * ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT HOLDER OR CONTRIBUTORS BE
27 * LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
28 * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
29 * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
30 * BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
31 * WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR
32 * OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF
33 * ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
35 * Contact Information:
36 * linux-drivers@emulex.com
40 * Costa Mesa, CA 92626
43 #include <linux/dma-mapping.h>
44 #include <rdma/ib_verbs.h>
45 #include <rdma/ib_user_verbs.h>
46 #include <rdma/iw_cm.h>
47 #include <rdma/ib_umem.h>
48 #include <rdma/ib_addr.h>
49 #include <rdma/ib_cache.h>
50 #include <rdma/uverbs_ioctl.h>
53 #include "ocrdma_hw.h"
54 #include "ocrdma_verbs.h"
55 #include <rdma/ocrdma-abi.h>
57 int ocrdma_query_pkey(struct ib_device
*ibdev
, u8 port
, u16 index
, u16
*pkey
)
66 int ocrdma_query_device(struct ib_device
*ibdev
, struct ib_device_attr
*attr
,
69 struct ocrdma_dev
*dev
= get_ocrdma_dev(ibdev
);
71 if (uhw
->inlen
|| uhw
->outlen
)
74 memset(attr
, 0, sizeof *attr
);
75 memcpy(&attr
->fw_ver
, &dev
->attr
.fw_ver
[0],
76 min(sizeof(dev
->attr
.fw_ver
), sizeof(attr
->fw_ver
)));
77 ocrdma_get_guid(dev
, (u8
*)&attr
->sys_image_guid
);
78 attr
->max_mr_size
= dev
->attr
.max_mr_size
;
79 attr
->page_size_cap
= 0xffff000;
80 attr
->vendor_id
= dev
->nic_info
.pdev
->vendor
;
81 attr
->vendor_part_id
= dev
->nic_info
.pdev
->device
;
82 attr
->hw_ver
= dev
->asic_id
;
83 attr
->max_qp
= dev
->attr
.max_qp
;
84 attr
->max_ah
= OCRDMA_MAX_AH
;
85 attr
->max_qp_wr
= dev
->attr
.max_wqe
;
87 attr
->device_cap_flags
= IB_DEVICE_CURR_QP_STATE_MOD
|
88 IB_DEVICE_RC_RNR_NAK_GEN
|
89 IB_DEVICE_SHUTDOWN_PORT
|
90 IB_DEVICE_SYS_IMAGE_GUID
|
91 IB_DEVICE_LOCAL_DMA_LKEY
|
92 IB_DEVICE_MEM_MGT_EXTENSIONS
;
93 attr
->max_send_sge
= dev
->attr
.max_send_sge
;
94 attr
->max_recv_sge
= dev
->attr
.max_recv_sge
;
95 attr
->max_sge_rd
= dev
->attr
.max_rdma_sge
;
96 attr
->max_cq
= dev
->attr
.max_cq
;
97 attr
->max_cqe
= dev
->attr
.max_cqe
;
98 attr
->max_mr
= dev
->attr
.max_mr
;
99 attr
->max_mw
= dev
->attr
.max_mw
;
100 attr
->max_pd
= dev
->attr
.max_pd
;
101 attr
->atomic_cap
= 0;
102 attr
->max_qp_rd_atom
=
103 min(dev
->attr
.max_ord_per_qp
, dev
->attr
.max_ird_per_qp
);
104 attr
->max_qp_init_rd_atom
= dev
->attr
.max_ord_per_qp
;
105 attr
->max_srq
= dev
->attr
.max_srq
;
106 attr
->max_srq_sge
= dev
->attr
.max_srq_sge
;
107 attr
->max_srq_wr
= dev
->attr
.max_rqe
;
108 attr
->local_ca_ack_delay
= dev
->attr
.local_ca_ack_delay
;
109 attr
->max_fast_reg_page_list_len
= dev
->attr
.max_pages_per_frmr
;
114 static inline void get_link_speed_and_width(struct ocrdma_dev
*dev
,
115 u16
*ib_speed
, u8
*ib_width
)
120 status
= ocrdma_mbx_get_link_speed(dev
, &speed
, NULL
);
122 speed
= OCRDMA_PHYS_LINK_SPEED_ZERO
;
125 case OCRDMA_PHYS_LINK_SPEED_1GBPS
:
126 *ib_speed
= IB_SPEED_SDR
;
127 *ib_width
= IB_WIDTH_1X
;
130 case OCRDMA_PHYS_LINK_SPEED_10GBPS
:
131 *ib_speed
= IB_SPEED_QDR
;
132 *ib_width
= IB_WIDTH_1X
;
135 case OCRDMA_PHYS_LINK_SPEED_20GBPS
:
136 *ib_speed
= IB_SPEED_DDR
;
137 *ib_width
= IB_WIDTH_4X
;
140 case OCRDMA_PHYS_LINK_SPEED_40GBPS
:
141 *ib_speed
= IB_SPEED_QDR
;
142 *ib_width
= IB_WIDTH_4X
;
147 *ib_speed
= IB_SPEED_SDR
;
148 *ib_width
= IB_WIDTH_1X
;
152 int ocrdma_query_port(struct ib_device
*ibdev
,
153 u8 port
, struct ib_port_attr
*props
)
155 enum ib_port_state port_state
;
156 struct ocrdma_dev
*dev
;
157 struct net_device
*netdev
;
159 /* props being zeroed by the caller, avoid zeroing it here */
160 dev
= get_ocrdma_dev(ibdev
);
161 netdev
= dev
->nic_info
.netdev
;
162 if (netif_running(netdev
) && netif_oper_up(netdev
)) {
163 port_state
= IB_PORT_ACTIVE
;
164 props
->phys_state
= IB_PORT_PHYS_STATE_LINK_UP
;
166 port_state
= IB_PORT_DOWN
;
167 props
->phys_state
= IB_PORT_PHYS_STATE_DISABLED
;
169 props
->max_mtu
= IB_MTU_4096
;
170 props
->active_mtu
= iboe_get_mtu(netdev
->mtu
);
175 props
->state
= port_state
;
176 props
->port_cap_flags
= IB_PORT_CM_SUP
| IB_PORT_REINIT_SUP
|
177 IB_PORT_DEVICE_MGMT_SUP
|
178 IB_PORT_VENDOR_CLASS_SUP
;
179 props
->ip_gids
= true;
180 props
->gid_tbl_len
= OCRDMA_MAX_SGID
;
181 props
->pkey_tbl_len
= 1;
182 props
->bad_pkey_cntr
= 0;
183 props
->qkey_viol_cntr
= 0;
184 get_link_speed_and_width(dev
, &props
->active_speed
,
185 &props
->active_width
);
186 props
->max_msg_sz
= 0x80000000;
187 props
->max_vl_num
= 4;
191 static int ocrdma_add_mmap(struct ocrdma_ucontext
*uctx
, u64 phy_addr
,
194 struct ocrdma_mm
*mm
;
196 mm
= kzalloc(sizeof(*mm
), GFP_KERNEL
);
199 mm
->key
.phy_addr
= phy_addr
;
201 INIT_LIST_HEAD(&mm
->entry
);
203 mutex_lock(&uctx
->mm_list_lock
);
204 list_add_tail(&mm
->entry
, &uctx
->mm_head
);
205 mutex_unlock(&uctx
->mm_list_lock
);
209 static void ocrdma_del_mmap(struct ocrdma_ucontext
*uctx
, u64 phy_addr
,
212 struct ocrdma_mm
*mm
, *tmp
;
214 mutex_lock(&uctx
->mm_list_lock
);
215 list_for_each_entry_safe(mm
, tmp
, &uctx
->mm_head
, entry
) {
216 if (len
!= mm
->key
.len
&& phy_addr
!= mm
->key
.phy_addr
)
219 list_del(&mm
->entry
);
223 mutex_unlock(&uctx
->mm_list_lock
);
226 static bool ocrdma_search_mmap(struct ocrdma_ucontext
*uctx
, u64 phy_addr
,
230 struct ocrdma_mm
*mm
;
232 mutex_lock(&uctx
->mm_list_lock
);
233 list_for_each_entry(mm
, &uctx
->mm_head
, entry
) {
234 if (len
!= mm
->key
.len
&& phy_addr
!= mm
->key
.phy_addr
)
240 mutex_unlock(&uctx
->mm_list_lock
);
245 static u16
_ocrdma_pd_mgr_get_bitmap(struct ocrdma_dev
*dev
, bool dpp_pool
)
247 u16 pd_bitmap_idx
= 0;
248 const unsigned long *pd_bitmap
;
251 pd_bitmap
= dev
->pd_mgr
->pd_dpp_bitmap
;
252 pd_bitmap_idx
= find_first_zero_bit(pd_bitmap
,
253 dev
->pd_mgr
->max_dpp_pd
);
254 __set_bit(pd_bitmap_idx
, dev
->pd_mgr
->pd_dpp_bitmap
);
255 dev
->pd_mgr
->pd_dpp_count
++;
256 if (dev
->pd_mgr
->pd_dpp_count
> dev
->pd_mgr
->pd_dpp_thrsh
)
257 dev
->pd_mgr
->pd_dpp_thrsh
= dev
->pd_mgr
->pd_dpp_count
;
259 pd_bitmap
= dev
->pd_mgr
->pd_norm_bitmap
;
260 pd_bitmap_idx
= find_first_zero_bit(pd_bitmap
,
261 dev
->pd_mgr
->max_normal_pd
);
262 __set_bit(pd_bitmap_idx
, dev
->pd_mgr
->pd_norm_bitmap
);
263 dev
->pd_mgr
->pd_norm_count
++;
264 if (dev
->pd_mgr
->pd_norm_count
> dev
->pd_mgr
->pd_norm_thrsh
)
265 dev
->pd_mgr
->pd_norm_thrsh
= dev
->pd_mgr
->pd_norm_count
;
267 return pd_bitmap_idx
;
270 static int _ocrdma_pd_mgr_put_bitmap(struct ocrdma_dev
*dev
, u16 pd_id
,
276 pd_count
= dpp_pool
? dev
->pd_mgr
->pd_dpp_count
:
277 dev
->pd_mgr
->pd_norm_count
;
282 pd_bit_index
= pd_id
- dev
->pd_mgr
->pd_dpp_start
;
283 if (pd_bit_index
>= dev
->pd_mgr
->max_dpp_pd
) {
286 __clear_bit(pd_bit_index
, dev
->pd_mgr
->pd_dpp_bitmap
);
287 dev
->pd_mgr
->pd_dpp_count
--;
290 pd_bit_index
= pd_id
- dev
->pd_mgr
->pd_norm_start
;
291 if (pd_bit_index
>= dev
->pd_mgr
->max_normal_pd
) {
294 __clear_bit(pd_bit_index
, dev
->pd_mgr
->pd_norm_bitmap
);
295 dev
->pd_mgr
->pd_norm_count
--;
302 static int ocrdma_put_pd_num(struct ocrdma_dev
*dev
, u16 pd_id
,
307 mutex_lock(&dev
->dev_lock
);
308 status
= _ocrdma_pd_mgr_put_bitmap(dev
, pd_id
, dpp_pool
);
309 mutex_unlock(&dev
->dev_lock
);
313 static int ocrdma_get_pd_num(struct ocrdma_dev
*dev
, struct ocrdma_pd
*pd
)
318 mutex_lock(&dev
->dev_lock
);
319 if (pd
->dpp_enabled
) {
320 /* try allocating DPP PD, if not available then normal PD */
321 if (dev
->pd_mgr
->pd_dpp_count
< dev
->pd_mgr
->max_dpp_pd
) {
322 pd_idx
= _ocrdma_pd_mgr_get_bitmap(dev
, true);
323 pd
->id
= dev
->pd_mgr
->pd_dpp_start
+ pd_idx
;
324 pd
->dpp_page
= dev
->pd_mgr
->dpp_page_index
+ pd_idx
;
325 } else if (dev
->pd_mgr
->pd_norm_count
<
326 dev
->pd_mgr
->max_normal_pd
) {
327 pd_idx
= _ocrdma_pd_mgr_get_bitmap(dev
, false);
328 pd
->id
= dev
->pd_mgr
->pd_norm_start
+ pd_idx
;
329 pd
->dpp_enabled
= false;
334 if (dev
->pd_mgr
->pd_norm_count
< dev
->pd_mgr
->max_normal_pd
) {
335 pd_idx
= _ocrdma_pd_mgr_get_bitmap(dev
, false);
336 pd
->id
= dev
->pd_mgr
->pd_norm_start
+ pd_idx
;
341 mutex_unlock(&dev
->dev_lock
);
348 * ocrdma_ucontext must be used here because this function is also
349 * called from ocrdma_alloc_ucontext where ib_udata does not have
350 * valid ib_ucontext pointer. ib_uverbs_get_context does not call
351 * uobj_{alloc|get_xxx} helpers which are used to store the
352 * ib_ucontext in uverbs_attr_bundle wrapping the ib_udata. so
353 * ib_udata does NOT imply valid ib_ucontext here!
355 static int _ocrdma_alloc_pd(struct ocrdma_dev
*dev
, struct ocrdma_pd
*pd
,
356 struct ocrdma_ucontext
*uctx
,
357 struct ib_udata
*udata
)
361 if (udata
&& uctx
&& dev
->attr
.max_dpp_pds
) {
363 ocrdma_get_asic_type(dev
) == OCRDMA_ASIC_GEN_SKH_R
;
365 pd
->dpp_enabled
? (dev
->nic_info
.db_page_size
/
366 dev
->attr
.wqe_size
) : 0;
369 if (dev
->pd_mgr
->pd_prealloc_valid
)
370 return ocrdma_get_pd_num(dev
, pd
);
373 status
= ocrdma_mbx_alloc_pd(dev
, pd
);
375 if (pd
->dpp_enabled
) {
376 pd
->dpp_enabled
= false;
386 static inline int is_ucontext_pd(struct ocrdma_ucontext
*uctx
,
387 struct ocrdma_pd
*pd
)
389 return (uctx
->cntxt_pd
== pd
);
392 static void _ocrdma_dealloc_pd(struct ocrdma_dev
*dev
,
393 struct ocrdma_pd
*pd
)
395 if (dev
->pd_mgr
->pd_prealloc_valid
)
396 ocrdma_put_pd_num(dev
, pd
->id
, pd
->dpp_enabled
);
398 ocrdma_mbx_dealloc_pd(dev
, pd
);
401 static int ocrdma_alloc_ucontext_pd(struct ocrdma_dev
*dev
,
402 struct ocrdma_ucontext
*uctx
,
403 struct ib_udata
*udata
)
405 struct ib_device
*ibdev
= &dev
->ibdev
;
409 pd
= rdma_zalloc_drv_obj(ibdev
, ib_pd
);
414 uctx
->cntxt_pd
= get_ocrdma_pd(pd
);
416 status
= _ocrdma_alloc_pd(dev
, uctx
->cntxt_pd
, uctx
, udata
);
418 kfree(uctx
->cntxt_pd
);
422 uctx
->cntxt_pd
->uctx
= uctx
;
423 uctx
->cntxt_pd
->ibpd
.device
= &dev
->ibdev
;
428 static void ocrdma_dealloc_ucontext_pd(struct ocrdma_ucontext
*uctx
)
430 struct ocrdma_pd
*pd
= uctx
->cntxt_pd
;
431 struct ocrdma_dev
*dev
= get_ocrdma_dev(pd
->ibpd
.device
);
433 if (uctx
->pd_in_use
) {
434 pr_err("%s(%d) Freeing in use pdid=0x%x.\n",
435 __func__
, dev
->id
, pd
->id
);
437 kfree(uctx
->cntxt_pd
);
438 uctx
->cntxt_pd
= NULL
;
439 _ocrdma_dealloc_pd(dev
, pd
);
442 static struct ocrdma_pd
*ocrdma_get_ucontext_pd(struct ocrdma_ucontext
*uctx
)
444 struct ocrdma_pd
*pd
= NULL
;
446 mutex_lock(&uctx
->mm_list_lock
);
447 if (!uctx
->pd_in_use
) {
448 uctx
->pd_in_use
= true;
451 mutex_unlock(&uctx
->mm_list_lock
);
456 static void ocrdma_release_ucontext_pd(struct ocrdma_ucontext
*uctx
)
458 mutex_lock(&uctx
->mm_list_lock
);
459 uctx
->pd_in_use
= false;
460 mutex_unlock(&uctx
->mm_list_lock
);
463 int ocrdma_alloc_ucontext(struct ib_ucontext
*uctx
, struct ib_udata
*udata
)
465 struct ib_device
*ibdev
= uctx
->device
;
467 struct ocrdma_ucontext
*ctx
= get_ocrdma_ucontext(uctx
);
468 struct ocrdma_alloc_ucontext_resp resp
= {};
469 struct ocrdma_dev
*dev
= get_ocrdma_dev(ibdev
);
470 struct pci_dev
*pdev
= dev
->nic_info
.pdev
;
471 u32 map_len
= roundup(sizeof(u32
) * 2048, PAGE_SIZE
);
475 INIT_LIST_HEAD(&ctx
->mm_head
);
476 mutex_init(&ctx
->mm_list_lock
);
478 ctx
->ah_tbl
.va
= dma_alloc_coherent(&pdev
->dev
, map_len
,
479 &ctx
->ah_tbl
.pa
, GFP_KERNEL
);
483 ctx
->ah_tbl
.len
= map_len
;
485 resp
.ah_tbl_len
= ctx
->ah_tbl
.len
;
486 resp
.ah_tbl_page
= virt_to_phys(ctx
->ah_tbl
.va
);
488 status
= ocrdma_add_mmap(ctx
, resp
.ah_tbl_page
, resp
.ah_tbl_len
);
492 status
= ocrdma_alloc_ucontext_pd(dev
, ctx
, udata
);
496 resp
.dev_id
= dev
->id
;
497 resp
.max_inline_data
= dev
->attr
.max_inline_data
;
498 resp
.wqe_size
= dev
->attr
.wqe_size
;
499 resp
.rqe_size
= dev
->attr
.rqe_size
;
500 resp
.dpp_wqe_size
= dev
->attr
.wqe_size
;
502 memcpy(resp
.fw_ver
, dev
->attr
.fw_ver
, sizeof(resp
.fw_ver
));
503 status
= ib_copy_to_udata(udata
, &resp
, sizeof(resp
));
509 ocrdma_dealloc_ucontext_pd(ctx
);
511 ocrdma_del_mmap(ctx
, ctx
->ah_tbl
.pa
, ctx
->ah_tbl
.len
);
513 dma_free_coherent(&pdev
->dev
, ctx
->ah_tbl
.len
, ctx
->ah_tbl
.va
,
518 void ocrdma_dealloc_ucontext(struct ib_ucontext
*ibctx
)
520 struct ocrdma_mm
*mm
, *tmp
;
521 struct ocrdma_ucontext
*uctx
= get_ocrdma_ucontext(ibctx
);
522 struct ocrdma_dev
*dev
= get_ocrdma_dev(ibctx
->device
);
523 struct pci_dev
*pdev
= dev
->nic_info
.pdev
;
525 ocrdma_dealloc_ucontext_pd(uctx
);
527 ocrdma_del_mmap(uctx
, uctx
->ah_tbl
.pa
, uctx
->ah_tbl
.len
);
528 dma_free_coherent(&pdev
->dev
, uctx
->ah_tbl
.len
, uctx
->ah_tbl
.va
,
531 list_for_each_entry_safe(mm
, tmp
, &uctx
->mm_head
, entry
) {
532 list_del(&mm
->entry
);
537 int ocrdma_mmap(struct ib_ucontext
*context
, struct vm_area_struct
*vma
)
539 struct ocrdma_ucontext
*ucontext
= get_ocrdma_ucontext(context
);
540 struct ocrdma_dev
*dev
= get_ocrdma_dev(context
->device
);
541 unsigned long vm_page
= vma
->vm_pgoff
<< PAGE_SHIFT
;
542 u64 unmapped_db
= (u64
) dev
->nic_info
.unmapped_db
;
543 unsigned long len
= (vma
->vm_end
- vma
->vm_start
);
547 if (vma
->vm_start
& (PAGE_SIZE
- 1))
549 found
= ocrdma_search_mmap(ucontext
, vma
->vm_pgoff
<< PAGE_SHIFT
, len
);
553 if ((vm_page
>= unmapped_db
) && (vm_page
<= (unmapped_db
+
554 dev
->nic_info
.db_total_size
)) &&
555 (len
<= dev
->nic_info
.db_page_size
)) {
556 if (vma
->vm_flags
& VM_READ
)
559 vma
->vm_page_prot
= pgprot_noncached(vma
->vm_page_prot
);
560 status
= io_remap_pfn_range(vma
, vma
->vm_start
, vma
->vm_pgoff
,
561 len
, vma
->vm_page_prot
);
562 } else if (dev
->nic_info
.dpp_unmapped_len
&&
563 (vm_page
>= (u64
) dev
->nic_info
.dpp_unmapped_addr
) &&
564 (vm_page
<= (u64
) (dev
->nic_info
.dpp_unmapped_addr
+
565 dev
->nic_info
.dpp_unmapped_len
)) &&
566 (len
<= dev
->nic_info
.dpp_unmapped_len
)) {
567 if (vma
->vm_flags
& VM_READ
)
570 vma
->vm_page_prot
= pgprot_writecombine(vma
->vm_page_prot
);
571 status
= io_remap_pfn_range(vma
, vma
->vm_start
, vma
->vm_pgoff
,
572 len
, vma
->vm_page_prot
);
574 status
= remap_pfn_range(vma
, vma
->vm_start
,
575 vma
->vm_pgoff
, len
, vma
->vm_page_prot
);
580 static int ocrdma_copy_pd_uresp(struct ocrdma_dev
*dev
, struct ocrdma_pd
*pd
,
581 struct ib_udata
*udata
)
585 u64 dpp_page_addr
= 0;
587 struct ocrdma_alloc_pd_uresp rsp
;
588 struct ocrdma_ucontext
*uctx
= rdma_udata_to_drv_context(
589 udata
, struct ocrdma_ucontext
, ibucontext
);
591 memset(&rsp
, 0, sizeof(rsp
));
593 rsp
.dpp_enabled
= pd
->dpp_enabled
;
594 db_page_addr
= ocrdma_get_db_addr(dev
, pd
->id
);
595 db_page_size
= dev
->nic_info
.db_page_size
;
597 status
= ocrdma_add_mmap(uctx
, db_page_addr
, db_page_size
);
601 if (pd
->dpp_enabled
) {
602 dpp_page_addr
= dev
->nic_info
.dpp_unmapped_addr
+
603 (pd
->id
* PAGE_SIZE
);
604 status
= ocrdma_add_mmap(uctx
, dpp_page_addr
,
608 rsp
.dpp_page_addr_hi
= upper_32_bits(dpp_page_addr
);
609 rsp
.dpp_page_addr_lo
= dpp_page_addr
;
612 status
= ib_copy_to_udata(udata
, &rsp
, sizeof(rsp
));
621 ocrdma_del_mmap(pd
->uctx
, dpp_page_addr
, PAGE_SIZE
);
623 ocrdma_del_mmap(pd
->uctx
, db_page_addr
, db_page_size
);
627 int ocrdma_alloc_pd(struct ib_pd
*ibpd
, struct ib_udata
*udata
)
629 struct ib_device
*ibdev
= ibpd
->device
;
630 struct ocrdma_dev
*dev
= get_ocrdma_dev(ibdev
);
631 struct ocrdma_pd
*pd
;
633 u8 is_uctx_pd
= false;
634 struct ocrdma_ucontext
*uctx
= rdma_udata_to_drv_context(
635 udata
, struct ocrdma_ucontext
, ibucontext
);
638 pd
= ocrdma_get_ucontext_pd(uctx
);
645 pd
= get_ocrdma_pd(ibpd
);
646 status
= _ocrdma_alloc_pd(dev
, pd
, uctx
, udata
);
652 status
= ocrdma_copy_pd_uresp(dev
, pd
, udata
);
660 ocrdma_release_ucontext_pd(uctx
);
662 _ocrdma_dealloc_pd(dev
, pd
);
667 int ocrdma_dealloc_pd(struct ib_pd
*ibpd
, struct ib_udata
*udata
)
669 struct ocrdma_pd
*pd
= get_ocrdma_pd(ibpd
);
670 struct ocrdma_dev
*dev
= get_ocrdma_dev(ibpd
->device
);
671 struct ocrdma_ucontext
*uctx
= NULL
;
676 u64 dpp_db
= dev
->nic_info
.dpp_unmapped_addr
+
677 (pd
->id
* PAGE_SIZE
);
679 ocrdma_del_mmap(pd
->uctx
, dpp_db
, PAGE_SIZE
);
680 usr_db
= ocrdma_get_db_addr(dev
, pd
->id
);
681 ocrdma_del_mmap(pd
->uctx
, usr_db
, dev
->nic_info
.db_page_size
);
683 if (is_ucontext_pd(uctx
, pd
)) {
684 ocrdma_release_ucontext_pd(uctx
);
688 _ocrdma_dealloc_pd(dev
, pd
);
692 static int ocrdma_alloc_lkey(struct ocrdma_dev
*dev
, struct ocrdma_mr
*mr
,
693 u32 pdid
, int acc
, u32 num_pbls
, u32 addr_check
)
698 mr
->hwmr
.local_rd
= 1;
699 mr
->hwmr
.remote_rd
= (acc
& IB_ACCESS_REMOTE_READ
) ? 1 : 0;
700 mr
->hwmr
.remote_wr
= (acc
& IB_ACCESS_REMOTE_WRITE
) ? 1 : 0;
701 mr
->hwmr
.local_wr
= (acc
& IB_ACCESS_LOCAL_WRITE
) ? 1 : 0;
702 mr
->hwmr
.mw_bind
= (acc
& IB_ACCESS_MW_BIND
) ? 1 : 0;
703 mr
->hwmr
.remote_atomic
= (acc
& IB_ACCESS_REMOTE_ATOMIC
) ? 1 : 0;
704 mr
->hwmr
.num_pbls
= num_pbls
;
706 status
= ocrdma_mbx_alloc_lkey(dev
, &mr
->hwmr
, pdid
, addr_check
);
710 mr
->ibmr
.lkey
= mr
->hwmr
.lkey
;
711 if (mr
->hwmr
.remote_wr
|| mr
->hwmr
.remote_rd
)
712 mr
->ibmr
.rkey
= mr
->hwmr
.lkey
;
716 struct ib_mr
*ocrdma_get_dma_mr(struct ib_pd
*ibpd
, int acc
)
719 struct ocrdma_mr
*mr
;
720 struct ocrdma_pd
*pd
= get_ocrdma_pd(ibpd
);
721 struct ocrdma_dev
*dev
= get_ocrdma_dev(ibpd
->device
);
723 if (acc
& IB_ACCESS_REMOTE_WRITE
&& !(acc
& IB_ACCESS_LOCAL_WRITE
)) {
724 pr_err("%s err, invalid access rights\n", __func__
);
725 return ERR_PTR(-EINVAL
);
728 mr
= kzalloc(sizeof(*mr
), GFP_KERNEL
);
730 return ERR_PTR(-ENOMEM
);
732 status
= ocrdma_alloc_lkey(dev
, mr
, pd
->id
, acc
, 0,
733 OCRDMA_ADDR_CHECK_DISABLE
);
736 return ERR_PTR(status
);
742 static void ocrdma_free_mr_pbl_tbl(struct ocrdma_dev
*dev
,
743 struct ocrdma_hw_mr
*mr
)
745 struct pci_dev
*pdev
= dev
->nic_info
.pdev
;
749 for (i
= 0; i
< mr
->num_pbls
; i
++) {
750 if (!mr
->pbl_table
[i
].va
)
752 dma_free_coherent(&pdev
->dev
, mr
->pbl_size
,
754 mr
->pbl_table
[i
].pa
);
756 kfree(mr
->pbl_table
);
757 mr
->pbl_table
= NULL
;
761 static int ocrdma_get_pbl_info(struct ocrdma_dev
*dev
, struct ocrdma_mr
*mr
,
770 pbl_size
= OCRDMA_MIN_HPAGE_SIZE
* (1 << idx
);
771 if (pbl_size
> MAX_OCRDMA_PBL_SIZE
) {
775 num_pbls
= roundup(num_pbes
, (pbl_size
/ sizeof(u64
)));
776 num_pbls
= num_pbls
/ (pbl_size
/ sizeof(u64
));
778 } while (num_pbls
>= dev
->attr
.max_num_mr_pbl
);
780 mr
->hwmr
.num_pbes
= num_pbes
;
781 mr
->hwmr
.num_pbls
= num_pbls
;
782 mr
->hwmr
.pbl_size
= pbl_size
;
786 static int ocrdma_build_pbl_tbl(struct ocrdma_dev
*dev
, struct ocrdma_hw_mr
*mr
)
790 u32 dma_len
= mr
->pbl_size
;
791 struct pci_dev
*pdev
= dev
->nic_info
.pdev
;
795 mr
->pbl_table
= kcalloc(mr
->num_pbls
, sizeof(struct ocrdma_pbl
),
801 for (i
= 0; i
< mr
->num_pbls
; i
++) {
802 va
= dma_alloc_coherent(&pdev
->dev
, dma_len
, &pa
, GFP_KERNEL
);
804 ocrdma_free_mr_pbl_tbl(dev
, mr
);
808 mr
->pbl_table
[i
].va
= va
;
809 mr
->pbl_table
[i
].pa
= pa
;
814 static void build_user_pbes(struct ocrdma_dev
*dev
, struct ocrdma_mr
*mr
)
816 struct ocrdma_pbe
*pbe
;
817 struct ib_block_iter biter
;
818 struct ocrdma_pbl
*pbl_tbl
= mr
->hwmr
.pbl_table
;
822 if (!mr
->hwmr
.num_pbes
)
825 pbe
= (struct ocrdma_pbe
*)pbl_tbl
->va
;
828 rdma_umem_for_each_dma_block (mr
->umem
, &biter
, PAGE_SIZE
) {
829 /* store the page address in pbe */
830 pg_addr
= rdma_block_iter_dma_address(&biter
);
831 pbe
->pa_lo
= cpu_to_le32(pg_addr
);
832 pbe
->pa_hi
= cpu_to_le32(upper_32_bits(pg_addr
));
836 /* if the given pbl is full storing the pbes,
839 if (pbe_cnt
== (mr
->hwmr
.pbl_size
/ sizeof(u64
))) {
841 pbe
= (struct ocrdma_pbe
*)pbl_tbl
->va
;
847 struct ib_mr
*ocrdma_reg_user_mr(struct ib_pd
*ibpd
, u64 start
, u64 len
,
848 u64 usr_addr
, int acc
, struct ib_udata
*udata
)
850 int status
= -ENOMEM
;
851 struct ocrdma_dev
*dev
= get_ocrdma_dev(ibpd
->device
);
852 struct ocrdma_mr
*mr
;
853 struct ocrdma_pd
*pd
;
855 pd
= get_ocrdma_pd(ibpd
);
857 if (acc
& IB_ACCESS_REMOTE_WRITE
&& !(acc
& IB_ACCESS_LOCAL_WRITE
))
858 return ERR_PTR(-EINVAL
);
860 mr
= kzalloc(sizeof(*mr
), GFP_KERNEL
);
862 return ERR_PTR(status
);
863 mr
->umem
= ib_umem_get(ibpd
->device
, start
, len
, acc
);
864 if (IS_ERR(mr
->umem
)) {
868 status
= ocrdma_get_pbl_info(
869 dev
, mr
, ib_umem_num_dma_blocks(mr
->umem
, PAGE_SIZE
));
873 mr
->hwmr
.pbe_size
= PAGE_SIZE
;
874 mr
->hwmr
.va
= usr_addr
;
876 mr
->hwmr
.remote_wr
= (acc
& IB_ACCESS_REMOTE_WRITE
) ? 1 : 0;
877 mr
->hwmr
.remote_rd
= (acc
& IB_ACCESS_REMOTE_READ
) ? 1 : 0;
878 mr
->hwmr
.local_wr
= (acc
& IB_ACCESS_LOCAL_WRITE
) ? 1 : 0;
879 mr
->hwmr
.local_rd
= 1;
880 mr
->hwmr
.remote_atomic
= (acc
& IB_ACCESS_REMOTE_ATOMIC
) ? 1 : 0;
881 status
= ocrdma_build_pbl_tbl(dev
, &mr
->hwmr
);
884 build_user_pbes(dev
, mr
);
885 status
= ocrdma_reg_mr(dev
, &mr
->hwmr
, pd
->id
, acc
);
888 mr
->ibmr
.lkey
= mr
->hwmr
.lkey
;
889 if (mr
->hwmr
.remote_wr
|| mr
->hwmr
.remote_rd
)
890 mr
->ibmr
.rkey
= mr
->hwmr
.lkey
;
895 ocrdma_free_mr_pbl_tbl(dev
, &mr
->hwmr
);
898 return ERR_PTR(status
);
901 int ocrdma_dereg_mr(struct ib_mr
*ib_mr
, struct ib_udata
*udata
)
903 struct ocrdma_mr
*mr
= get_ocrdma_mr(ib_mr
);
904 struct ocrdma_dev
*dev
= get_ocrdma_dev(ib_mr
->device
);
906 (void) ocrdma_mbx_dealloc_lkey(dev
, mr
->hwmr
.fr_mr
, mr
->hwmr
.lkey
);
909 ocrdma_free_mr_pbl_tbl(dev
, &mr
->hwmr
);
911 /* it could be user registered memory. */
912 ib_umem_release(mr
->umem
);
915 /* Don't stop cleanup, in case FW is unresponsive */
916 if (dev
->mqe_ctx
.fw_error_state
) {
917 pr_err("%s(%d) fw not responding.\n",
923 static int ocrdma_copy_cq_uresp(struct ocrdma_dev
*dev
, struct ocrdma_cq
*cq
,
924 struct ib_udata
*udata
)
927 struct ocrdma_ucontext
*uctx
= rdma_udata_to_drv_context(
928 udata
, struct ocrdma_ucontext
, ibucontext
);
929 struct ocrdma_create_cq_uresp uresp
;
931 /* this must be user flow! */
935 memset(&uresp
, 0, sizeof(uresp
));
936 uresp
.cq_id
= cq
->id
;
937 uresp
.page_size
= PAGE_ALIGN(cq
->len
);
939 uresp
.max_hw_cqe
= cq
->max_hw_cqe
;
940 uresp
.page_addr
[0] = virt_to_phys(cq
->va
);
941 uresp
.db_page_addr
= ocrdma_get_db_addr(dev
, uctx
->cntxt_pd
->id
);
942 uresp
.db_page_size
= dev
->nic_info
.db_page_size
;
943 uresp
.phase_change
= cq
->phase_change
? 1 : 0;
944 status
= ib_copy_to_udata(udata
, &uresp
, sizeof(uresp
));
946 pr_err("%s(%d) copy error cqid=0x%x.\n",
947 __func__
, dev
->id
, cq
->id
);
950 status
= ocrdma_add_mmap(uctx
, uresp
.db_page_addr
, uresp
.db_page_size
);
953 status
= ocrdma_add_mmap(uctx
, uresp
.page_addr
[0], uresp
.page_size
);
955 ocrdma_del_mmap(uctx
, uresp
.db_page_addr
, uresp
.db_page_size
);
963 int ocrdma_create_cq(struct ib_cq
*ibcq
, const struct ib_cq_init_attr
*attr
,
964 struct ib_udata
*udata
)
966 struct ib_device
*ibdev
= ibcq
->device
;
967 int entries
= attr
->cqe
;
968 struct ocrdma_cq
*cq
= get_ocrdma_cq(ibcq
);
969 struct ocrdma_dev
*dev
= get_ocrdma_dev(ibdev
);
970 struct ocrdma_ucontext
*uctx
= rdma_udata_to_drv_context(
971 udata
, struct ocrdma_ucontext
, ibucontext
);
974 struct ocrdma_create_cq_ureq ureq
;
980 if (ib_copy_from_udata(&ureq
, udata
, sizeof(ureq
)))
985 spin_lock_init(&cq
->cq_lock
);
986 spin_lock_init(&cq
->comp_handler_lock
);
987 INIT_LIST_HEAD(&cq
->sq_head
);
988 INIT_LIST_HEAD(&cq
->rq_head
);
991 pd_id
= uctx
->cntxt_pd
->id
;
993 status
= ocrdma_mbx_create_cq(dev
, cq
, entries
, ureq
.dpp_cq
, pd_id
);
998 status
= ocrdma_copy_cq_uresp(dev
, cq
, udata
);
1002 cq
->phase
= OCRDMA_CQE_VALID
;
1003 dev
->cq_tbl
[cq
->id
] = cq
;
1007 ocrdma_mbx_destroy_cq(dev
, cq
);
1011 int ocrdma_resize_cq(struct ib_cq
*ibcq
, int new_cnt
,
1012 struct ib_udata
*udata
)
1015 struct ocrdma_cq
*cq
= get_ocrdma_cq(ibcq
);
1017 if (new_cnt
< 1 || new_cnt
> cq
->max_hw_cqe
) {
1021 ibcq
->cqe
= new_cnt
;
1025 static void ocrdma_flush_cq(struct ocrdma_cq
*cq
)
1028 int valid_count
= 0;
1029 unsigned long flags
;
1031 struct ocrdma_dev
*dev
= get_ocrdma_dev(cq
->ibcq
.device
);
1032 struct ocrdma_cqe
*cqe
= NULL
;
1035 cqe_cnt
= cq
->cqe_cnt
;
1037 /* Last irq might have scheduled a polling thread
1038 * sync-up with it before hard flushing.
1040 spin_lock_irqsave(&cq
->cq_lock
, flags
);
1042 if (is_cqe_valid(cq
, cqe
))
1047 ocrdma_ring_cq_db(dev
, cq
->id
, false, false, valid_count
);
1048 spin_unlock_irqrestore(&cq
->cq_lock
, flags
);
1051 int ocrdma_destroy_cq(struct ib_cq
*ibcq
, struct ib_udata
*udata
)
1053 struct ocrdma_cq
*cq
= get_ocrdma_cq(ibcq
);
1054 struct ocrdma_eq
*eq
= NULL
;
1055 struct ocrdma_dev
*dev
= get_ocrdma_dev(ibcq
->device
);
1059 dev
->cq_tbl
[cq
->id
] = NULL
;
1060 indx
= ocrdma_get_eq_table_index(dev
, cq
->eqn
);
1062 eq
= &dev
->eq_tbl
[indx
];
1063 irq
= ocrdma_get_irq(dev
, eq
);
1064 synchronize_irq(irq
);
1065 ocrdma_flush_cq(cq
);
1067 ocrdma_mbx_destroy_cq(dev
, cq
);
1069 pdid
= cq
->ucontext
->cntxt_pd
->id
;
1070 ocrdma_del_mmap(cq
->ucontext
, (u64
) cq
->pa
,
1071 PAGE_ALIGN(cq
->len
));
1072 ocrdma_del_mmap(cq
->ucontext
,
1073 ocrdma_get_db_addr(dev
, pdid
),
1074 dev
->nic_info
.db_page_size
);
1079 static int ocrdma_add_qpn_map(struct ocrdma_dev
*dev
, struct ocrdma_qp
*qp
)
1081 int status
= -EINVAL
;
1083 if (qp
->id
< OCRDMA_MAX_QP
&& dev
->qp_tbl
[qp
->id
] == NULL
) {
1084 dev
->qp_tbl
[qp
->id
] = qp
;
1090 static void ocrdma_del_qpn_map(struct ocrdma_dev
*dev
, struct ocrdma_qp
*qp
)
1092 dev
->qp_tbl
[qp
->id
] = NULL
;
1095 static int ocrdma_check_qp_params(struct ib_pd
*ibpd
, struct ocrdma_dev
*dev
,
1096 struct ib_qp_init_attr
*attrs
,
1097 struct ib_udata
*udata
)
1099 if ((attrs
->qp_type
!= IB_QPT_GSI
) &&
1100 (attrs
->qp_type
!= IB_QPT_RC
) &&
1101 (attrs
->qp_type
!= IB_QPT_UC
) &&
1102 (attrs
->qp_type
!= IB_QPT_UD
)) {
1103 pr_err("%s(%d) unsupported qp type=0x%x requested\n",
1104 __func__
, dev
->id
, attrs
->qp_type
);
1107 /* Skip the check for QP1 to support CM size of 128 */
1108 if ((attrs
->qp_type
!= IB_QPT_GSI
) &&
1109 (attrs
->cap
.max_send_wr
> dev
->attr
.max_wqe
)) {
1110 pr_err("%s(%d) unsupported send_wr=0x%x requested\n",
1111 __func__
, dev
->id
, attrs
->cap
.max_send_wr
);
1112 pr_err("%s(%d) supported send_wr=0x%x\n",
1113 __func__
, dev
->id
, dev
->attr
.max_wqe
);
1116 if (!attrs
->srq
&& (attrs
->cap
.max_recv_wr
> dev
->attr
.max_rqe
)) {
1117 pr_err("%s(%d) unsupported recv_wr=0x%x requested\n",
1118 __func__
, dev
->id
, attrs
->cap
.max_recv_wr
);
1119 pr_err("%s(%d) supported recv_wr=0x%x\n",
1120 __func__
, dev
->id
, dev
->attr
.max_rqe
);
1123 if (attrs
->cap
.max_inline_data
> dev
->attr
.max_inline_data
) {
1124 pr_err("%s(%d) unsupported inline data size=0x%x requested\n",
1125 __func__
, dev
->id
, attrs
->cap
.max_inline_data
);
1126 pr_err("%s(%d) supported inline data size=0x%x\n",
1127 __func__
, dev
->id
, dev
->attr
.max_inline_data
);
1130 if (attrs
->cap
.max_send_sge
> dev
->attr
.max_send_sge
) {
1131 pr_err("%s(%d) unsupported send_sge=0x%x requested\n",
1132 __func__
, dev
->id
, attrs
->cap
.max_send_sge
);
1133 pr_err("%s(%d) supported send_sge=0x%x\n",
1134 __func__
, dev
->id
, dev
->attr
.max_send_sge
);
1137 if (attrs
->cap
.max_recv_sge
> dev
->attr
.max_recv_sge
) {
1138 pr_err("%s(%d) unsupported recv_sge=0x%x requested\n",
1139 __func__
, dev
->id
, attrs
->cap
.max_recv_sge
);
1140 pr_err("%s(%d) supported recv_sge=0x%x\n",
1141 __func__
, dev
->id
, dev
->attr
.max_recv_sge
);
1144 /* unprivileged user space cannot create special QP */
1145 if (udata
&& attrs
->qp_type
== IB_QPT_GSI
) {
1147 ("%s(%d) Userspace can't create special QPs of type=0x%x\n",
1148 __func__
, dev
->id
, attrs
->qp_type
);
1151 /* allow creating only one GSI type of QP */
1152 if (attrs
->qp_type
== IB_QPT_GSI
&& dev
->gsi_qp_created
) {
1153 pr_err("%s(%d) GSI special QPs already created.\n",
1157 /* verify consumer QPs are not trying to use GSI QP's CQ */
1158 if ((attrs
->qp_type
!= IB_QPT_GSI
) && (dev
->gsi_qp_created
)) {
1159 if ((dev
->gsi_sqcq
== get_ocrdma_cq(attrs
->send_cq
)) ||
1160 (dev
->gsi_rqcq
== get_ocrdma_cq(attrs
->recv_cq
))) {
1161 pr_err("%s(%d) Consumer QP cannot use GSI CQs.\n",
1169 static int ocrdma_copy_qp_uresp(struct ocrdma_qp
*qp
,
1170 struct ib_udata
*udata
, int dpp_offset
,
1171 int dpp_credit_lmt
, int srq
)
1175 struct ocrdma_create_qp_uresp uresp
;
1176 struct ocrdma_pd
*pd
= qp
->pd
;
1177 struct ocrdma_dev
*dev
= get_ocrdma_dev(pd
->ibpd
.device
);
1179 memset(&uresp
, 0, sizeof(uresp
));
1180 usr_db
= dev
->nic_info
.unmapped_db
+
1181 (pd
->id
* dev
->nic_info
.db_page_size
);
1182 uresp
.qp_id
= qp
->id
;
1183 uresp
.sq_dbid
= qp
->sq
.dbid
;
1184 uresp
.num_sq_pages
= 1;
1185 uresp
.sq_page_size
= PAGE_ALIGN(qp
->sq
.len
);
1186 uresp
.sq_page_addr
[0] = virt_to_phys(qp
->sq
.va
);
1187 uresp
.num_wqe_allocated
= qp
->sq
.max_cnt
;
1189 uresp
.rq_dbid
= qp
->rq
.dbid
;
1190 uresp
.num_rq_pages
= 1;
1191 uresp
.rq_page_size
= PAGE_ALIGN(qp
->rq
.len
);
1192 uresp
.rq_page_addr
[0] = virt_to_phys(qp
->rq
.va
);
1193 uresp
.num_rqe_allocated
= qp
->rq
.max_cnt
;
1195 uresp
.db_page_addr
= usr_db
;
1196 uresp
.db_page_size
= dev
->nic_info
.db_page_size
;
1197 uresp
.db_sq_offset
= OCRDMA_DB_GEN2_SQ_OFFSET
;
1198 uresp
.db_rq_offset
= OCRDMA_DB_GEN2_RQ_OFFSET
;
1199 uresp
.db_shift
= OCRDMA_DB_RQ_SHIFT
;
1201 if (qp
->dpp_enabled
) {
1202 uresp
.dpp_credit
= dpp_credit_lmt
;
1203 uresp
.dpp_offset
= dpp_offset
;
1205 status
= ib_copy_to_udata(udata
, &uresp
, sizeof(uresp
));
1207 pr_err("%s(%d) user copy error.\n", __func__
, dev
->id
);
1210 status
= ocrdma_add_mmap(pd
->uctx
, uresp
.sq_page_addr
[0],
1211 uresp
.sq_page_size
);
1216 status
= ocrdma_add_mmap(pd
->uctx
, uresp
.rq_page_addr
[0],
1217 uresp
.rq_page_size
);
1223 ocrdma_del_mmap(pd
->uctx
, uresp
.sq_page_addr
[0], uresp
.sq_page_size
);
1228 static void ocrdma_set_qp_db(struct ocrdma_dev
*dev
, struct ocrdma_qp
*qp
,
1229 struct ocrdma_pd
*pd
)
1231 if (ocrdma_get_asic_type(dev
) == OCRDMA_ASIC_GEN_SKH_R
) {
1232 qp
->sq_db
= dev
->nic_info
.db
+
1233 (pd
->id
* dev
->nic_info
.db_page_size
) +
1234 OCRDMA_DB_GEN2_SQ_OFFSET
;
1235 qp
->rq_db
= dev
->nic_info
.db
+
1236 (pd
->id
* dev
->nic_info
.db_page_size
) +
1237 OCRDMA_DB_GEN2_RQ_OFFSET
;
1239 qp
->sq_db
= dev
->nic_info
.db
+
1240 (pd
->id
* dev
->nic_info
.db_page_size
) +
1241 OCRDMA_DB_SQ_OFFSET
;
1242 qp
->rq_db
= dev
->nic_info
.db
+
1243 (pd
->id
* dev
->nic_info
.db_page_size
) +
1244 OCRDMA_DB_RQ_OFFSET
;
1248 static int ocrdma_alloc_wr_id_tbl(struct ocrdma_qp
*qp
)
1251 kcalloc(qp
->sq
.max_cnt
, sizeof(*(qp
->wqe_wr_id_tbl
)),
1253 if (qp
->wqe_wr_id_tbl
== NULL
)
1256 kcalloc(qp
->rq
.max_cnt
, sizeof(u64
), GFP_KERNEL
);
1257 if (qp
->rqe_wr_id_tbl
== NULL
)
1263 static void ocrdma_set_qp_init_params(struct ocrdma_qp
*qp
,
1264 struct ocrdma_pd
*pd
,
1265 struct ib_qp_init_attr
*attrs
)
1268 spin_lock_init(&qp
->q_lock
);
1269 INIT_LIST_HEAD(&qp
->sq_entry
);
1270 INIT_LIST_HEAD(&qp
->rq_entry
);
1272 qp
->qp_type
= attrs
->qp_type
;
1273 qp
->cap_flags
= OCRDMA_QP_INB_RD
| OCRDMA_QP_INB_WR
;
1274 qp
->max_inline_data
= attrs
->cap
.max_inline_data
;
1275 qp
->sq
.max_sges
= attrs
->cap
.max_send_sge
;
1276 qp
->rq
.max_sges
= attrs
->cap
.max_recv_sge
;
1277 qp
->state
= OCRDMA_QPS_RST
;
1278 qp
->signaled
= (attrs
->sq_sig_type
== IB_SIGNAL_ALL_WR
) ? true : false;
1281 static void ocrdma_store_gsi_qp_cq(struct ocrdma_dev
*dev
,
1282 struct ib_qp_init_attr
*attrs
)
1284 if (attrs
->qp_type
== IB_QPT_GSI
) {
1285 dev
->gsi_qp_created
= 1;
1286 dev
->gsi_sqcq
= get_ocrdma_cq(attrs
->send_cq
);
1287 dev
->gsi_rqcq
= get_ocrdma_cq(attrs
->recv_cq
);
1291 struct ib_qp
*ocrdma_create_qp(struct ib_pd
*ibpd
,
1292 struct ib_qp_init_attr
*attrs
,
1293 struct ib_udata
*udata
)
1296 struct ocrdma_pd
*pd
= get_ocrdma_pd(ibpd
);
1297 struct ocrdma_qp
*qp
;
1298 struct ocrdma_dev
*dev
= get_ocrdma_dev(ibpd
->device
);
1299 struct ocrdma_create_qp_ureq ureq
;
1300 u16 dpp_credit_lmt
, dpp_offset
;
1302 if (attrs
->create_flags
)
1303 return ERR_PTR(-EOPNOTSUPP
);
1305 status
= ocrdma_check_qp_params(ibpd
, dev
, attrs
, udata
);
1309 memset(&ureq
, 0, sizeof(ureq
));
1311 if (ib_copy_from_udata(&ureq
, udata
, sizeof(ureq
)))
1312 return ERR_PTR(-EFAULT
);
1314 qp
= kzalloc(sizeof(*qp
), GFP_KERNEL
);
1319 ocrdma_set_qp_init_params(qp
, pd
, attrs
);
1321 qp
->cap_flags
|= (OCRDMA_QP_MW_BIND
| OCRDMA_QP_LKEY0
|
1322 OCRDMA_QP_FAST_REG
);
1324 mutex_lock(&dev
->dev_lock
);
1325 status
= ocrdma_mbx_create_qp(qp
, attrs
, ureq
.enable_dpp_cq
,
1327 &dpp_offset
, &dpp_credit_lmt
);
1331 /* user space QP's wr_id table are managed in library */
1332 if (udata
== NULL
) {
1333 status
= ocrdma_alloc_wr_id_tbl(qp
);
1338 status
= ocrdma_add_qpn_map(dev
, qp
);
1341 ocrdma_set_qp_db(dev
, qp
, pd
);
1343 status
= ocrdma_copy_qp_uresp(qp
, udata
, dpp_offset
,
1345 (attrs
->srq
!= NULL
));
1349 ocrdma_store_gsi_qp_cq(dev
, attrs
);
1350 qp
->ibqp
.qp_num
= qp
->id
;
1351 mutex_unlock(&dev
->dev_lock
);
1355 ocrdma_del_qpn_map(dev
, qp
);
1357 ocrdma_mbx_destroy_qp(dev
, qp
);
1359 mutex_unlock(&dev
->dev_lock
);
1360 kfree(qp
->wqe_wr_id_tbl
);
1361 kfree(qp
->rqe_wr_id_tbl
);
1363 pr_err("%s(%d) error=%d\n", __func__
, dev
->id
, status
);
1365 return ERR_PTR(status
);
1368 int _ocrdma_modify_qp(struct ib_qp
*ibqp
, struct ib_qp_attr
*attr
,
1372 struct ocrdma_qp
*qp
;
1373 struct ocrdma_dev
*dev
;
1374 enum ib_qp_state old_qps
;
1376 qp
= get_ocrdma_qp(ibqp
);
1377 dev
= get_ocrdma_dev(ibqp
->device
);
1378 if (attr_mask
& IB_QP_STATE
)
1379 status
= ocrdma_qp_state_change(qp
, attr
->qp_state
, &old_qps
);
1380 /* if new and previous states are same hw doesn't need to
1385 return ocrdma_mbx_modify_qp(dev
, qp
, attr
, attr_mask
);
1388 int ocrdma_modify_qp(struct ib_qp
*ibqp
, struct ib_qp_attr
*attr
,
1389 int attr_mask
, struct ib_udata
*udata
)
1391 unsigned long flags
;
1392 int status
= -EINVAL
;
1393 struct ocrdma_qp
*qp
;
1394 struct ocrdma_dev
*dev
;
1395 enum ib_qp_state old_qps
, new_qps
;
1397 if (attr_mask
& ~IB_QP_ATTR_STANDARD_BITS
)
1400 qp
= get_ocrdma_qp(ibqp
);
1401 dev
= get_ocrdma_dev(ibqp
->device
);
1403 /* syncronize with multiple context trying to change, retrive qps */
1404 mutex_lock(&dev
->dev_lock
);
1405 /* syncronize with wqe, rqe posting and cqe processing contexts */
1406 spin_lock_irqsave(&qp
->q_lock
, flags
);
1407 old_qps
= get_ibqp_state(qp
->state
);
1408 if (attr_mask
& IB_QP_STATE
)
1409 new_qps
= attr
->qp_state
;
1412 spin_unlock_irqrestore(&qp
->q_lock
, flags
);
1414 if (!ib_modify_qp_is_ok(old_qps
, new_qps
, ibqp
->qp_type
, attr_mask
)) {
1415 pr_err("%s(%d) invalid attribute mask=0x%x specified for\n"
1416 "qpn=0x%x of type=0x%x old_qps=0x%x, new_qps=0x%x\n",
1417 __func__
, dev
->id
, attr_mask
, qp
->id
, ibqp
->qp_type
,
1422 status
= _ocrdma_modify_qp(ibqp
, attr
, attr_mask
);
1426 mutex_unlock(&dev
->dev_lock
);
1430 static enum ib_mtu
ocrdma_mtu_int_to_enum(u16 mtu
)
1448 static int ocrdma_to_ib_qp_acc_flags(int qp_cap_flags
)
1450 int ib_qp_acc_flags
= 0;
1452 if (qp_cap_flags
& OCRDMA_QP_INB_WR
)
1453 ib_qp_acc_flags
|= IB_ACCESS_REMOTE_WRITE
;
1454 if (qp_cap_flags
& OCRDMA_QP_INB_RD
)
1455 ib_qp_acc_flags
|= IB_ACCESS_LOCAL_WRITE
;
1456 return ib_qp_acc_flags
;
1459 int ocrdma_query_qp(struct ib_qp
*ibqp
,
1460 struct ib_qp_attr
*qp_attr
,
1461 int attr_mask
, struct ib_qp_init_attr
*qp_init_attr
)
1465 struct ocrdma_qp_params params
;
1466 struct ocrdma_qp
*qp
= get_ocrdma_qp(ibqp
);
1467 struct ocrdma_dev
*dev
= get_ocrdma_dev(ibqp
->device
);
1469 memset(¶ms
, 0, sizeof(params
));
1470 mutex_lock(&dev
->dev_lock
);
1471 status
= ocrdma_mbx_query_qp(dev
, qp
, ¶ms
);
1472 mutex_unlock(&dev
->dev_lock
);
1475 if (qp
->qp_type
== IB_QPT_UD
)
1476 qp_attr
->qkey
= params
.qkey
;
1478 ocrdma_mtu_int_to_enum(params
.path_mtu_pkey_indx
&
1479 OCRDMA_QP_PARAMS_PATH_MTU_MASK
) >>
1480 OCRDMA_QP_PARAMS_PATH_MTU_SHIFT
;
1481 qp_attr
->path_mig_state
= IB_MIG_MIGRATED
;
1482 qp_attr
->rq_psn
= params
.hop_lmt_rq_psn
& OCRDMA_QP_PARAMS_RQ_PSN_MASK
;
1483 qp_attr
->sq_psn
= params
.tclass_sq_psn
& OCRDMA_QP_PARAMS_SQ_PSN_MASK
;
1484 qp_attr
->dest_qp_num
=
1485 params
.ack_to_rnr_rtc_dest_qpn
& OCRDMA_QP_PARAMS_DEST_QPN_MASK
;
1487 qp_attr
->qp_access_flags
= ocrdma_to_ib_qp_acc_flags(qp
->cap_flags
);
1488 qp_attr
->cap
.max_send_wr
= qp
->sq
.max_cnt
- 1;
1489 qp_attr
->cap
.max_recv_wr
= qp
->rq
.max_cnt
- 1;
1490 qp_attr
->cap
.max_send_sge
= qp
->sq
.max_sges
;
1491 qp_attr
->cap
.max_recv_sge
= qp
->rq
.max_sges
;
1492 qp_attr
->cap
.max_inline_data
= qp
->max_inline_data
;
1493 qp_init_attr
->cap
= qp_attr
->cap
;
1494 qp_attr
->ah_attr
.type
= RDMA_AH_ATTR_TYPE_ROCE
;
1496 rdma_ah_set_grh(&qp_attr
->ah_attr
, NULL
,
1497 params
.rnt_rc_sl_fl
&
1498 OCRDMA_QP_PARAMS_FLOW_LABEL_MASK
,
1500 (params
.hop_lmt_rq_psn
&
1501 OCRDMA_QP_PARAMS_HOP_LMT_MASK
) >>
1502 OCRDMA_QP_PARAMS_HOP_LMT_SHIFT
,
1503 (params
.tclass_sq_psn
&
1504 OCRDMA_QP_PARAMS_TCLASS_MASK
) >>
1505 OCRDMA_QP_PARAMS_TCLASS_SHIFT
);
1506 rdma_ah_set_dgid_raw(&qp_attr
->ah_attr
, ¶ms
.dgid
[0]);
1508 rdma_ah_set_port_num(&qp_attr
->ah_attr
, 1);
1509 rdma_ah_set_sl(&qp_attr
->ah_attr
, (params
.rnt_rc_sl_fl
&
1510 OCRDMA_QP_PARAMS_SL_MASK
) >>
1511 OCRDMA_QP_PARAMS_SL_SHIFT
);
1512 qp_attr
->timeout
= (params
.ack_to_rnr_rtc_dest_qpn
&
1513 OCRDMA_QP_PARAMS_ACK_TIMEOUT_MASK
) >>
1514 OCRDMA_QP_PARAMS_ACK_TIMEOUT_SHIFT
;
1515 qp_attr
->rnr_retry
= (params
.ack_to_rnr_rtc_dest_qpn
&
1516 OCRDMA_QP_PARAMS_RNR_RETRY_CNT_MASK
) >>
1517 OCRDMA_QP_PARAMS_RNR_RETRY_CNT_SHIFT
;
1518 qp_attr
->retry_cnt
=
1519 (params
.rnt_rc_sl_fl
& OCRDMA_QP_PARAMS_RETRY_CNT_MASK
) >>
1520 OCRDMA_QP_PARAMS_RETRY_CNT_SHIFT
;
1521 qp_attr
->min_rnr_timer
= 0;
1522 qp_attr
->pkey_index
= 0;
1523 qp_attr
->port_num
= 1;
1524 rdma_ah_set_path_bits(&qp_attr
->ah_attr
, 0);
1525 rdma_ah_set_static_rate(&qp_attr
->ah_attr
, 0);
1526 qp_attr
->alt_pkey_index
= 0;
1527 qp_attr
->alt_port_num
= 0;
1528 qp_attr
->alt_timeout
= 0;
1529 memset(&qp_attr
->alt_ah_attr
, 0, sizeof(qp_attr
->alt_ah_attr
));
1530 qp_state
= (params
.max_sge_recv_flags
& OCRDMA_QP_PARAMS_STATE_MASK
) >>
1531 OCRDMA_QP_PARAMS_STATE_SHIFT
;
1532 qp_attr
->qp_state
= get_ibqp_state(qp_state
);
1533 qp_attr
->cur_qp_state
= qp_attr
->qp_state
;
1534 qp_attr
->sq_draining
= (qp_state
== OCRDMA_QPS_SQ_DRAINING
) ? 1 : 0;
1535 qp_attr
->max_dest_rd_atomic
=
1536 params
.max_ord_ird
>> OCRDMA_QP_PARAMS_MAX_ORD_SHIFT
;
1537 qp_attr
->max_rd_atomic
=
1538 params
.max_ord_ird
& OCRDMA_QP_PARAMS_MAX_IRD_MASK
;
1539 qp_attr
->en_sqd_async_notify
= (params
.max_sge_recv_flags
&
1540 OCRDMA_QP_PARAMS_FLAGS_SQD_ASYNC
) ? 1 : 0;
1541 /* Sync driver QP state with FW */
1542 ocrdma_qp_state_change(qp
, qp_attr
->qp_state
, NULL
);
1547 static void ocrdma_srq_toggle_bit(struct ocrdma_srq
*srq
, unsigned int idx
)
1549 unsigned int i
= idx
/ 32;
1550 u32 mask
= (1U << (idx
% 32));
1552 srq
->idx_bit_fields
[i
] ^= mask
;
1555 static int ocrdma_hwq_free_cnt(struct ocrdma_qp_hwq_info
*q
)
1557 return ((q
->max_wqe_idx
- q
->head
) + q
->tail
) % q
->max_cnt
;
1560 static int is_hw_sq_empty(struct ocrdma_qp
*qp
)
1562 return (qp
->sq
.tail
== qp
->sq
.head
);
1565 static int is_hw_rq_empty(struct ocrdma_qp
*qp
)
1567 return (qp
->rq
.tail
== qp
->rq
.head
);
1570 static void *ocrdma_hwq_head(struct ocrdma_qp_hwq_info
*q
)
1572 return q
->va
+ (q
->head
* q
->entry_size
);
1575 static void *ocrdma_hwq_head_from_idx(struct ocrdma_qp_hwq_info
*q
,
1578 return q
->va
+ (idx
* q
->entry_size
);
1581 static void ocrdma_hwq_inc_head(struct ocrdma_qp_hwq_info
*q
)
1583 q
->head
= (q
->head
+ 1) & q
->max_wqe_idx
;
1586 static void ocrdma_hwq_inc_tail(struct ocrdma_qp_hwq_info
*q
)
1588 q
->tail
= (q
->tail
+ 1) & q
->max_wqe_idx
;
1591 /* discard the cqe for a given QP */
1592 static void ocrdma_discard_cqes(struct ocrdma_qp
*qp
, struct ocrdma_cq
*cq
)
1594 unsigned long cq_flags
;
1595 unsigned long flags
;
1596 int discard_cnt
= 0;
1597 u32 cur_getp
, stop_getp
;
1598 struct ocrdma_cqe
*cqe
;
1599 u32 qpn
= 0, wqe_idx
= 0;
1601 spin_lock_irqsave(&cq
->cq_lock
, cq_flags
);
1603 /* traverse through the CQEs in the hw CQ,
1604 * find the matching CQE for a given qp,
1605 * mark the matching one discarded by clearing qpn.
1606 * ring the doorbell in the poll_cq() as
1607 * we don't complete out of order cqe.
1610 cur_getp
= cq
->getp
;
1611 /* find upto when do we reap the cq. */
1612 stop_getp
= cur_getp
;
1614 if (is_hw_sq_empty(qp
) && (!qp
->srq
&& is_hw_rq_empty(qp
)))
1617 cqe
= cq
->va
+ cur_getp
;
1618 /* if (a) done reaping whole hw cq, or
1619 * (b) qp_xq becomes empty.
1622 qpn
= cqe
->cmn
.qpn
& OCRDMA_CQE_QPN_MASK
;
1623 /* if previously discarded cqe found, skip that too. */
1624 /* check for matching qp */
1625 if (qpn
== 0 || qpn
!= qp
->id
)
1628 if (is_cqe_for_sq(cqe
)) {
1629 ocrdma_hwq_inc_tail(&qp
->sq
);
1632 wqe_idx
= (le32_to_cpu(cqe
->rq
.buftag_qpn
) >>
1633 OCRDMA_CQE_BUFTAG_SHIFT
) &
1634 qp
->srq
->rq
.max_wqe_idx
;
1635 BUG_ON(wqe_idx
< 1);
1636 spin_lock_irqsave(&qp
->srq
->q_lock
, flags
);
1637 ocrdma_hwq_inc_tail(&qp
->srq
->rq
);
1638 ocrdma_srq_toggle_bit(qp
->srq
, wqe_idx
- 1);
1639 spin_unlock_irqrestore(&qp
->srq
->q_lock
, flags
);
1642 ocrdma_hwq_inc_tail(&qp
->rq
);
1645 /* mark cqe discarded so that it is not picked up later
1651 cur_getp
= (cur_getp
+ 1) % cq
->max_hw_cqe
;
1652 } while (cur_getp
!= stop_getp
);
1653 spin_unlock_irqrestore(&cq
->cq_lock
, cq_flags
);
1656 void ocrdma_del_flush_qp(struct ocrdma_qp
*qp
)
1659 unsigned long flags
;
1660 struct ocrdma_dev
*dev
= get_ocrdma_dev(qp
->ibqp
.device
);
1661 /* sync with any active CQ poll */
1663 spin_lock_irqsave(&dev
->flush_q_lock
, flags
);
1664 found
= ocrdma_is_qp_in_sq_flushlist(qp
->sq_cq
, qp
);
1666 list_del(&qp
->sq_entry
);
1668 found
= ocrdma_is_qp_in_rq_flushlist(qp
->rq_cq
, qp
);
1670 list_del(&qp
->rq_entry
);
1672 spin_unlock_irqrestore(&dev
->flush_q_lock
, flags
);
1675 int ocrdma_destroy_qp(struct ib_qp
*ibqp
, struct ib_udata
*udata
)
1677 struct ocrdma_pd
*pd
;
1678 struct ocrdma_qp
*qp
;
1679 struct ocrdma_dev
*dev
;
1680 struct ib_qp_attr attrs
;
1682 unsigned long flags
;
1684 qp
= get_ocrdma_qp(ibqp
);
1685 dev
= get_ocrdma_dev(ibqp
->device
);
1689 /* change the QP state to ERROR */
1690 if (qp
->state
!= OCRDMA_QPS_RST
) {
1691 attrs
.qp_state
= IB_QPS_ERR
;
1692 attr_mask
= IB_QP_STATE
;
1693 _ocrdma_modify_qp(ibqp
, &attrs
, attr_mask
);
1695 /* ensure that CQEs for newly created QP (whose id may be same with
1696 * one which just getting destroyed are same), dont get
1697 * discarded until the old CQEs are discarded.
1699 mutex_lock(&dev
->dev_lock
);
1700 (void) ocrdma_mbx_destroy_qp(dev
, qp
);
1703 * acquire CQ lock while destroy is in progress, in order to
1704 * protect against proessing in-flight CQEs for this QP.
1706 spin_lock_irqsave(&qp
->sq_cq
->cq_lock
, flags
);
1707 if (qp
->rq_cq
&& (qp
->rq_cq
!= qp
->sq_cq
)) {
1708 spin_lock(&qp
->rq_cq
->cq_lock
);
1709 ocrdma_del_qpn_map(dev
, qp
);
1710 spin_unlock(&qp
->rq_cq
->cq_lock
);
1712 ocrdma_del_qpn_map(dev
, qp
);
1714 spin_unlock_irqrestore(&qp
->sq_cq
->cq_lock
, flags
);
1717 ocrdma_discard_cqes(qp
, qp
->sq_cq
);
1718 ocrdma_discard_cqes(qp
, qp
->rq_cq
);
1720 mutex_unlock(&dev
->dev_lock
);
1723 ocrdma_del_mmap(pd
->uctx
, (u64
) qp
->sq
.pa
,
1724 PAGE_ALIGN(qp
->sq
.len
));
1726 ocrdma_del_mmap(pd
->uctx
, (u64
) qp
->rq
.pa
,
1727 PAGE_ALIGN(qp
->rq
.len
));
1730 ocrdma_del_flush_qp(qp
);
1732 kfree(qp
->wqe_wr_id_tbl
);
1733 kfree(qp
->rqe_wr_id_tbl
);
1738 static int ocrdma_copy_srq_uresp(struct ocrdma_dev
*dev
, struct ocrdma_srq
*srq
,
1739 struct ib_udata
*udata
)
1742 struct ocrdma_create_srq_uresp uresp
;
1744 memset(&uresp
, 0, sizeof(uresp
));
1745 uresp
.rq_dbid
= srq
->rq
.dbid
;
1746 uresp
.num_rq_pages
= 1;
1747 uresp
.rq_page_addr
[0] = virt_to_phys(srq
->rq
.va
);
1748 uresp
.rq_page_size
= srq
->rq
.len
;
1749 uresp
.db_page_addr
= dev
->nic_info
.unmapped_db
+
1750 (srq
->pd
->id
* dev
->nic_info
.db_page_size
);
1751 uresp
.db_page_size
= dev
->nic_info
.db_page_size
;
1752 uresp
.num_rqe_allocated
= srq
->rq
.max_cnt
;
1753 if (ocrdma_get_asic_type(dev
) == OCRDMA_ASIC_GEN_SKH_R
) {
1754 uresp
.db_rq_offset
= OCRDMA_DB_GEN2_RQ_OFFSET
;
1755 uresp
.db_shift
= 24;
1757 uresp
.db_rq_offset
= OCRDMA_DB_RQ_OFFSET
;
1758 uresp
.db_shift
= 16;
1761 status
= ib_copy_to_udata(udata
, &uresp
, sizeof(uresp
));
1764 status
= ocrdma_add_mmap(srq
->pd
->uctx
, uresp
.rq_page_addr
[0],
1765 uresp
.rq_page_size
);
1771 int ocrdma_create_srq(struct ib_srq
*ibsrq
, struct ib_srq_init_attr
*init_attr
,
1772 struct ib_udata
*udata
)
1775 struct ocrdma_pd
*pd
= get_ocrdma_pd(ibsrq
->pd
);
1776 struct ocrdma_dev
*dev
= get_ocrdma_dev(ibsrq
->device
);
1777 struct ocrdma_srq
*srq
= get_ocrdma_srq(ibsrq
);
1779 if (init_attr
->srq_type
!= IB_SRQT_BASIC
)
1782 if (init_attr
->attr
.max_sge
> dev
->attr
.max_recv_sge
)
1784 if (init_attr
->attr
.max_wr
> dev
->attr
.max_rqe
)
1787 spin_lock_init(&srq
->q_lock
);
1789 srq
->db
= dev
->nic_info
.db
+ (pd
->id
* dev
->nic_info
.db_page_size
);
1790 status
= ocrdma_mbx_create_srq(dev
, srq
, init_attr
, pd
);
1795 srq
->rqe_wr_id_tbl
= kcalloc(srq
->rq
.max_cnt
, sizeof(u64
),
1797 if (!srq
->rqe_wr_id_tbl
) {
1802 srq
->bit_fields_len
= (srq
->rq
.max_cnt
/ 32) +
1803 (srq
->rq
.max_cnt
% 32 ? 1 : 0);
1804 srq
->idx_bit_fields
=
1805 kmalloc_array(srq
->bit_fields_len
, sizeof(u32
),
1807 if (!srq
->idx_bit_fields
) {
1811 memset(srq
->idx_bit_fields
, 0xff,
1812 srq
->bit_fields_len
* sizeof(u32
));
1815 if (init_attr
->attr
.srq_limit
) {
1816 status
= ocrdma_mbx_modify_srq(srq
, &init_attr
->attr
);
1822 status
= ocrdma_copy_srq_uresp(dev
, srq
, udata
);
1830 ocrdma_mbx_destroy_srq(dev
, srq
);
1831 kfree(srq
->rqe_wr_id_tbl
);
1832 kfree(srq
->idx_bit_fields
);
1836 int ocrdma_modify_srq(struct ib_srq
*ibsrq
,
1837 struct ib_srq_attr
*srq_attr
,
1838 enum ib_srq_attr_mask srq_attr_mask
,
1839 struct ib_udata
*udata
)
1842 struct ocrdma_srq
*srq
;
1844 srq
= get_ocrdma_srq(ibsrq
);
1845 if (srq_attr_mask
& IB_SRQ_MAX_WR
)
1848 status
= ocrdma_mbx_modify_srq(srq
, srq_attr
);
1852 int ocrdma_query_srq(struct ib_srq
*ibsrq
, struct ib_srq_attr
*srq_attr
)
1855 struct ocrdma_srq
*srq
;
1857 srq
= get_ocrdma_srq(ibsrq
);
1858 status
= ocrdma_mbx_query_srq(srq
, srq_attr
);
1862 int ocrdma_destroy_srq(struct ib_srq
*ibsrq
, struct ib_udata
*udata
)
1864 struct ocrdma_srq
*srq
;
1865 struct ocrdma_dev
*dev
= get_ocrdma_dev(ibsrq
->device
);
1867 srq
= get_ocrdma_srq(ibsrq
);
1869 ocrdma_mbx_destroy_srq(dev
, srq
);
1872 ocrdma_del_mmap(srq
->pd
->uctx
, (u64
) srq
->rq
.pa
,
1873 PAGE_ALIGN(srq
->rq
.len
));
1875 kfree(srq
->idx_bit_fields
);
1876 kfree(srq
->rqe_wr_id_tbl
);
1880 /* unprivileged verbs and their support functions. */
1881 static void ocrdma_build_ud_hdr(struct ocrdma_qp
*qp
,
1882 struct ocrdma_hdr_wqe
*hdr
,
1883 const struct ib_send_wr
*wr
)
1885 struct ocrdma_ewqe_ud_hdr
*ud_hdr
=
1886 (struct ocrdma_ewqe_ud_hdr
*)(hdr
+ 1);
1887 struct ocrdma_ah
*ah
= get_ocrdma_ah(ud_wr(wr
)->ah
);
1889 ud_hdr
->rsvd_dest_qpn
= ud_wr(wr
)->remote_qpn
;
1890 if (qp
->qp_type
== IB_QPT_GSI
)
1891 ud_hdr
->qkey
= qp
->qkey
;
1893 ud_hdr
->qkey
= ud_wr(wr
)->remote_qkey
;
1894 ud_hdr
->rsvd_ahid
= ah
->id
;
1895 ud_hdr
->hdr_type
= ah
->hdr_type
;
1896 if (ah
->av
->valid
& OCRDMA_AV_VLAN_VALID
)
1897 hdr
->cw
|= (OCRDMA_FLAG_AH_VLAN_PR
<< OCRDMA_WQE_FLAGS_SHIFT
);
1900 static void ocrdma_build_sges(struct ocrdma_hdr_wqe
*hdr
,
1901 struct ocrdma_sge
*sge
, int num_sge
,
1902 struct ib_sge
*sg_list
)
1906 for (i
= 0; i
< num_sge
; i
++) {
1907 sge
[i
].lrkey
= sg_list
[i
].lkey
;
1908 sge
[i
].addr_lo
= sg_list
[i
].addr
;
1909 sge
[i
].addr_hi
= upper_32_bits(sg_list
[i
].addr
);
1910 sge
[i
].len
= sg_list
[i
].length
;
1911 hdr
->total_len
+= sg_list
[i
].length
;
1914 memset(sge
, 0, sizeof(*sge
));
1917 static inline uint32_t ocrdma_sglist_len(struct ib_sge
*sg_list
, int num_sge
)
1919 uint32_t total_len
= 0, i
;
1921 for (i
= 0; i
< num_sge
; i
++)
1922 total_len
+= sg_list
[i
].length
;
1927 static int ocrdma_build_inline_sges(struct ocrdma_qp
*qp
,
1928 struct ocrdma_hdr_wqe
*hdr
,
1929 struct ocrdma_sge
*sge
,
1930 const struct ib_send_wr
*wr
, u32 wqe_size
)
1935 if (wr
->send_flags
& IB_SEND_INLINE
&& qp
->qp_type
!= IB_QPT_UD
) {
1936 hdr
->total_len
= ocrdma_sglist_len(wr
->sg_list
, wr
->num_sge
);
1937 if (unlikely(hdr
->total_len
> qp
->max_inline_data
)) {
1938 pr_err("%s() supported_len=0x%x,\n"
1939 " unsupported len req=0x%x\n", __func__
,
1940 qp
->max_inline_data
, hdr
->total_len
);
1943 dpp_addr
= (char *)sge
;
1944 for (i
= 0; i
< wr
->num_sge
; i
++) {
1946 (void *)(unsigned long)wr
->sg_list
[i
].addr
,
1947 wr
->sg_list
[i
].length
);
1948 dpp_addr
+= wr
->sg_list
[i
].length
;
1951 wqe_size
+= roundup(hdr
->total_len
, OCRDMA_WQE_ALIGN_BYTES
);
1952 if (0 == hdr
->total_len
)
1953 wqe_size
+= sizeof(struct ocrdma_sge
);
1954 hdr
->cw
|= (OCRDMA_TYPE_INLINE
<< OCRDMA_WQE_TYPE_SHIFT
);
1956 ocrdma_build_sges(hdr
, sge
, wr
->num_sge
, wr
->sg_list
);
1958 wqe_size
+= (wr
->num_sge
* sizeof(struct ocrdma_sge
));
1960 wqe_size
+= sizeof(struct ocrdma_sge
);
1961 hdr
->cw
|= (OCRDMA_TYPE_LKEY
<< OCRDMA_WQE_TYPE_SHIFT
);
1963 hdr
->cw
|= ((wqe_size
/ OCRDMA_WQE_STRIDE
) << OCRDMA_WQE_SIZE_SHIFT
);
1967 static int ocrdma_build_send(struct ocrdma_qp
*qp
, struct ocrdma_hdr_wqe
*hdr
,
1968 const struct ib_send_wr
*wr
)
1971 struct ocrdma_sge
*sge
;
1972 u32 wqe_size
= sizeof(*hdr
);
1974 if (qp
->qp_type
== IB_QPT_UD
|| qp
->qp_type
== IB_QPT_GSI
) {
1975 ocrdma_build_ud_hdr(qp
, hdr
, wr
);
1976 sge
= (struct ocrdma_sge
*)(hdr
+ 2);
1977 wqe_size
+= sizeof(struct ocrdma_ewqe_ud_hdr
);
1979 sge
= (struct ocrdma_sge
*)(hdr
+ 1);
1982 status
= ocrdma_build_inline_sges(qp
, hdr
, sge
, wr
, wqe_size
);
1986 static int ocrdma_build_write(struct ocrdma_qp
*qp
, struct ocrdma_hdr_wqe
*hdr
,
1987 const struct ib_send_wr
*wr
)
1990 struct ocrdma_sge
*ext_rw
= (struct ocrdma_sge
*)(hdr
+ 1);
1991 struct ocrdma_sge
*sge
= ext_rw
+ 1;
1992 u32 wqe_size
= sizeof(*hdr
) + sizeof(*ext_rw
);
1994 status
= ocrdma_build_inline_sges(qp
, hdr
, sge
, wr
, wqe_size
);
1997 ext_rw
->addr_lo
= rdma_wr(wr
)->remote_addr
;
1998 ext_rw
->addr_hi
= upper_32_bits(rdma_wr(wr
)->remote_addr
);
1999 ext_rw
->lrkey
= rdma_wr(wr
)->rkey
;
2000 ext_rw
->len
= hdr
->total_len
;
2004 static void ocrdma_build_read(struct ocrdma_qp
*qp
, struct ocrdma_hdr_wqe
*hdr
,
2005 const struct ib_send_wr
*wr
)
2007 struct ocrdma_sge
*ext_rw
= (struct ocrdma_sge
*)(hdr
+ 1);
2008 struct ocrdma_sge
*sge
= ext_rw
+ 1;
2009 u32 wqe_size
= ((wr
->num_sge
+ 1) * sizeof(struct ocrdma_sge
)) +
2010 sizeof(struct ocrdma_hdr_wqe
);
2012 ocrdma_build_sges(hdr
, sge
, wr
->num_sge
, wr
->sg_list
);
2013 hdr
->cw
|= ((wqe_size
/ OCRDMA_WQE_STRIDE
) << OCRDMA_WQE_SIZE_SHIFT
);
2014 hdr
->cw
|= (OCRDMA_READ
<< OCRDMA_WQE_OPCODE_SHIFT
);
2015 hdr
->cw
|= (OCRDMA_TYPE_LKEY
<< OCRDMA_WQE_TYPE_SHIFT
);
2017 ext_rw
->addr_lo
= rdma_wr(wr
)->remote_addr
;
2018 ext_rw
->addr_hi
= upper_32_bits(rdma_wr(wr
)->remote_addr
);
2019 ext_rw
->lrkey
= rdma_wr(wr
)->rkey
;
2020 ext_rw
->len
= hdr
->total_len
;
2023 static int get_encoded_page_size(int pg_sz
)
2025 /* Max size is 256M 4096 << 16 */
2028 if (pg_sz
== (4096 << i
))
2033 static int ocrdma_build_reg(struct ocrdma_qp
*qp
,
2034 struct ocrdma_hdr_wqe
*hdr
,
2035 const struct ib_reg_wr
*wr
)
2038 struct ocrdma_ewqe_fr
*fast_reg
= (struct ocrdma_ewqe_fr
*)(hdr
+ 1);
2039 struct ocrdma_mr
*mr
= get_ocrdma_mr(wr
->mr
);
2040 struct ocrdma_pbl
*pbl_tbl
= mr
->hwmr
.pbl_table
;
2041 struct ocrdma_pbe
*pbe
;
2042 u32 wqe_size
= sizeof(*fast_reg
) + sizeof(*hdr
);
2043 int num_pbes
= 0, i
;
2045 wqe_size
= roundup(wqe_size
, OCRDMA_WQE_ALIGN_BYTES
);
2047 hdr
->cw
|= (OCRDMA_FR_MR
<< OCRDMA_WQE_OPCODE_SHIFT
);
2048 hdr
->cw
|= ((wqe_size
/ OCRDMA_WQE_STRIDE
) << OCRDMA_WQE_SIZE_SHIFT
);
2050 if (wr
->access
& IB_ACCESS_LOCAL_WRITE
)
2051 hdr
->rsvd_lkey_flags
|= OCRDMA_LKEY_FLAG_LOCAL_WR
;
2052 if (wr
->access
& IB_ACCESS_REMOTE_WRITE
)
2053 hdr
->rsvd_lkey_flags
|= OCRDMA_LKEY_FLAG_REMOTE_WR
;
2054 if (wr
->access
& IB_ACCESS_REMOTE_READ
)
2055 hdr
->rsvd_lkey_flags
|= OCRDMA_LKEY_FLAG_REMOTE_RD
;
2056 hdr
->lkey
= wr
->key
;
2057 hdr
->total_len
= mr
->ibmr
.length
;
2059 fbo
= mr
->ibmr
.iova
- mr
->pages
[0];
2061 fast_reg
->va_hi
= upper_32_bits(mr
->ibmr
.iova
);
2062 fast_reg
->va_lo
= (u32
) (mr
->ibmr
.iova
& 0xffffffff);
2063 fast_reg
->fbo_hi
= upper_32_bits(fbo
);
2064 fast_reg
->fbo_lo
= (u32
) fbo
& 0xffffffff;
2065 fast_reg
->num_sges
= mr
->npages
;
2066 fast_reg
->size_sge
= get_encoded_page_size(mr
->ibmr
.page_size
);
2069 for (i
= 0; i
< mr
->npages
; i
++) {
2070 u64 buf_addr
= mr
->pages
[i
];
2072 pbe
->pa_lo
= cpu_to_le32((u32
) (buf_addr
& PAGE_MASK
));
2073 pbe
->pa_hi
= cpu_to_le32((u32
) upper_32_bits(buf_addr
));
2077 /* if the pbl is full storing the pbes,
2080 if (num_pbes
== (mr
->hwmr
.pbl_size
/sizeof(u64
))) {
2082 pbe
= (struct ocrdma_pbe
*)pbl_tbl
->va
;
2089 static void ocrdma_ring_sq_db(struct ocrdma_qp
*qp
)
2091 u32 val
= qp
->sq
.dbid
| (1 << OCRDMA_DB_SQ_SHIFT
);
2093 iowrite32(val
, qp
->sq_db
);
2096 int ocrdma_post_send(struct ib_qp
*ibqp
, const struct ib_send_wr
*wr
,
2097 const struct ib_send_wr
**bad_wr
)
2100 struct ocrdma_qp
*qp
= get_ocrdma_qp(ibqp
);
2101 struct ocrdma_hdr_wqe
*hdr
;
2102 unsigned long flags
;
2104 spin_lock_irqsave(&qp
->q_lock
, flags
);
2105 if (qp
->state
!= OCRDMA_QPS_RTS
&& qp
->state
!= OCRDMA_QPS_SQD
) {
2106 spin_unlock_irqrestore(&qp
->q_lock
, flags
);
2112 if (qp
->qp_type
== IB_QPT_UD
&&
2113 (wr
->opcode
!= IB_WR_SEND
&&
2114 wr
->opcode
!= IB_WR_SEND_WITH_IMM
)) {
2119 if (ocrdma_hwq_free_cnt(&qp
->sq
) == 0 ||
2120 wr
->num_sge
> qp
->sq
.max_sges
) {
2125 hdr
= ocrdma_hwq_head(&qp
->sq
);
2127 if (wr
->send_flags
& IB_SEND_SIGNALED
|| qp
->signaled
)
2128 hdr
->cw
|= (OCRDMA_FLAG_SIG
<< OCRDMA_WQE_FLAGS_SHIFT
);
2129 if (wr
->send_flags
& IB_SEND_FENCE
)
2131 (OCRDMA_FLAG_FENCE_L
<< OCRDMA_WQE_FLAGS_SHIFT
);
2132 if (wr
->send_flags
& IB_SEND_SOLICITED
)
2134 (OCRDMA_FLAG_SOLICIT
<< OCRDMA_WQE_FLAGS_SHIFT
);
2136 switch (wr
->opcode
) {
2137 case IB_WR_SEND_WITH_IMM
:
2138 hdr
->cw
|= (OCRDMA_FLAG_IMM
<< OCRDMA_WQE_FLAGS_SHIFT
);
2139 hdr
->immdt
= ntohl(wr
->ex
.imm_data
);
2142 hdr
->cw
|= (OCRDMA_SEND
<< OCRDMA_WQE_OPCODE_SHIFT
);
2143 ocrdma_build_send(qp
, hdr
, wr
);
2145 case IB_WR_SEND_WITH_INV
:
2146 hdr
->cw
|= (OCRDMA_FLAG_INV
<< OCRDMA_WQE_FLAGS_SHIFT
);
2147 hdr
->cw
|= (OCRDMA_SEND
<< OCRDMA_WQE_OPCODE_SHIFT
);
2148 hdr
->lkey
= wr
->ex
.invalidate_rkey
;
2149 status
= ocrdma_build_send(qp
, hdr
, wr
);
2151 case IB_WR_RDMA_WRITE_WITH_IMM
:
2152 hdr
->cw
|= (OCRDMA_FLAG_IMM
<< OCRDMA_WQE_FLAGS_SHIFT
);
2153 hdr
->immdt
= ntohl(wr
->ex
.imm_data
);
2155 case IB_WR_RDMA_WRITE
:
2156 hdr
->cw
|= (OCRDMA_WRITE
<< OCRDMA_WQE_OPCODE_SHIFT
);
2157 status
= ocrdma_build_write(qp
, hdr
, wr
);
2159 case IB_WR_RDMA_READ
:
2160 ocrdma_build_read(qp
, hdr
, wr
);
2162 case IB_WR_LOCAL_INV
:
2164 (OCRDMA_LKEY_INV
<< OCRDMA_WQE_OPCODE_SHIFT
);
2165 hdr
->cw
|= ((sizeof(struct ocrdma_hdr_wqe
) +
2166 sizeof(struct ocrdma_sge
)) /
2167 OCRDMA_WQE_STRIDE
) << OCRDMA_WQE_SIZE_SHIFT
;
2168 hdr
->lkey
= wr
->ex
.invalidate_rkey
;
2171 status
= ocrdma_build_reg(qp
, hdr
, reg_wr(wr
));
2181 if (wr
->send_flags
& IB_SEND_SIGNALED
|| qp
->signaled
)
2182 qp
->wqe_wr_id_tbl
[qp
->sq
.head
].signaled
= 1;
2184 qp
->wqe_wr_id_tbl
[qp
->sq
.head
].signaled
= 0;
2185 qp
->wqe_wr_id_tbl
[qp
->sq
.head
].wrid
= wr
->wr_id
;
2186 ocrdma_cpu_to_le32(hdr
, ((hdr
->cw
>> OCRDMA_WQE_SIZE_SHIFT
) &
2187 OCRDMA_WQE_SIZE_MASK
) * OCRDMA_WQE_STRIDE
);
2188 /* make sure wqe is written before adapter can access it */
2190 /* inform hw to start processing it */
2191 ocrdma_ring_sq_db(qp
);
2193 /* update pointer, counter for next wr */
2194 ocrdma_hwq_inc_head(&qp
->sq
);
2197 spin_unlock_irqrestore(&qp
->q_lock
, flags
);
2201 static void ocrdma_ring_rq_db(struct ocrdma_qp
*qp
)
2203 u32 val
= qp
->rq
.dbid
| (1 << OCRDMA_DB_RQ_SHIFT
);
2205 iowrite32(val
, qp
->rq_db
);
2208 static void ocrdma_build_rqe(struct ocrdma_hdr_wqe
*rqe
,
2209 const struct ib_recv_wr
*wr
, u16 tag
)
2212 struct ocrdma_sge
*sge
;
2214 wqe_size
= (wr
->num_sge
* sizeof(*sge
)) + sizeof(*rqe
);
2216 wqe_size
= sizeof(*sge
) + sizeof(*rqe
);
2218 rqe
->cw
= ((wqe_size
/ OCRDMA_WQE_STRIDE
) <<
2219 OCRDMA_WQE_SIZE_SHIFT
);
2220 rqe
->cw
|= (OCRDMA_FLAG_SIG
<< OCRDMA_WQE_FLAGS_SHIFT
);
2221 rqe
->cw
|= (OCRDMA_TYPE_LKEY
<< OCRDMA_WQE_TYPE_SHIFT
);
2223 rqe
->rsvd_tag
= tag
;
2224 sge
= (struct ocrdma_sge
*)(rqe
+ 1);
2225 ocrdma_build_sges(rqe
, sge
, wr
->num_sge
, wr
->sg_list
);
2226 ocrdma_cpu_to_le32(rqe
, wqe_size
);
2229 int ocrdma_post_recv(struct ib_qp
*ibqp
, const struct ib_recv_wr
*wr
,
2230 const struct ib_recv_wr
**bad_wr
)
2233 unsigned long flags
;
2234 struct ocrdma_qp
*qp
= get_ocrdma_qp(ibqp
);
2235 struct ocrdma_hdr_wqe
*rqe
;
2237 spin_lock_irqsave(&qp
->q_lock
, flags
);
2238 if (qp
->state
== OCRDMA_QPS_RST
|| qp
->state
== OCRDMA_QPS_ERR
) {
2239 spin_unlock_irqrestore(&qp
->q_lock
, flags
);
2244 if (ocrdma_hwq_free_cnt(&qp
->rq
) == 0 ||
2245 wr
->num_sge
> qp
->rq
.max_sges
) {
2250 rqe
= ocrdma_hwq_head(&qp
->rq
);
2251 ocrdma_build_rqe(rqe
, wr
, 0);
2253 qp
->rqe_wr_id_tbl
[qp
->rq
.head
] = wr
->wr_id
;
2254 /* make sure rqe is written before adapter can access it */
2257 /* inform hw to start processing it */
2258 ocrdma_ring_rq_db(qp
);
2260 /* update pointer, counter for next wr */
2261 ocrdma_hwq_inc_head(&qp
->rq
);
2264 spin_unlock_irqrestore(&qp
->q_lock
, flags
);
2268 /* cqe for srq's rqe can potentially arrive out of order.
2269 * index gives the entry in the shadow table where to store
2270 * the wr_id. tag/index is returned in cqe to reference back
2273 static int ocrdma_srq_get_idx(struct ocrdma_srq
*srq
)
2278 for (row
= 0; row
< srq
->bit_fields_len
; row
++) {
2279 if (srq
->idx_bit_fields
[row
]) {
2280 indx
= ffs(srq
->idx_bit_fields
[row
]);
2281 indx
= (row
* 32) + (indx
- 1);
2282 BUG_ON(indx
>= srq
->rq
.max_cnt
);
2283 ocrdma_srq_toggle_bit(srq
, indx
);
2288 BUG_ON(row
== srq
->bit_fields_len
);
2289 return indx
+ 1; /* Use from index 1 */
2292 static void ocrdma_ring_srq_db(struct ocrdma_srq
*srq
)
2294 u32 val
= srq
->rq
.dbid
| (1 << 16);
2296 iowrite32(val
, srq
->db
+ OCRDMA_DB_GEN2_SRQ_OFFSET
);
2299 int ocrdma_post_srq_recv(struct ib_srq
*ibsrq
, const struct ib_recv_wr
*wr
,
2300 const struct ib_recv_wr
**bad_wr
)
2303 unsigned long flags
;
2304 struct ocrdma_srq
*srq
;
2305 struct ocrdma_hdr_wqe
*rqe
;
2308 srq
= get_ocrdma_srq(ibsrq
);
2310 spin_lock_irqsave(&srq
->q_lock
, flags
);
2312 if (ocrdma_hwq_free_cnt(&srq
->rq
) == 0 ||
2313 wr
->num_sge
> srq
->rq
.max_sges
) {
2318 tag
= ocrdma_srq_get_idx(srq
);
2319 rqe
= ocrdma_hwq_head(&srq
->rq
);
2320 ocrdma_build_rqe(rqe
, wr
, tag
);
2322 srq
->rqe_wr_id_tbl
[tag
] = wr
->wr_id
;
2323 /* make sure rqe is written before adapter can perform DMA */
2325 /* inform hw to start processing it */
2326 ocrdma_ring_srq_db(srq
);
2327 /* update pointer, counter for next wr */
2328 ocrdma_hwq_inc_head(&srq
->rq
);
2331 spin_unlock_irqrestore(&srq
->q_lock
, flags
);
2335 static enum ib_wc_status
ocrdma_to_ibwc_err(u16 status
)
2337 enum ib_wc_status ibwc_status
;
2340 case OCRDMA_CQE_GENERAL_ERR
:
2341 ibwc_status
= IB_WC_GENERAL_ERR
;
2343 case OCRDMA_CQE_LOC_LEN_ERR
:
2344 ibwc_status
= IB_WC_LOC_LEN_ERR
;
2346 case OCRDMA_CQE_LOC_QP_OP_ERR
:
2347 ibwc_status
= IB_WC_LOC_QP_OP_ERR
;
2349 case OCRDMA_CQE_LOC_EEC_OP_ERR
:
2350 ibwc_status
= IB_WC_LOC_EEC_OP_ERR
;
2352 case OCRDMA_CQE_LOC_PROT_ERR
:
2353 ibwc_status
= IB_WC_LOC_PROT_ERR
;
2355 case OCRDMA_CQE_WR_FLUSH_ERR
:
2356 ibwc_status
= IB_WC_WR_FLUSH_ERR
;
2358 case OCRDMA_CQE_MW_BIND_ERR
:
2359 ibwc_status
= IB_WC_MW_BIND_ERR
;
2361 case OCRDMA_CQE_BAD_RESP_ERR
:
2362 ibwc_status
= IB_WC_BAD_RESP_ERR
;
2364 case OCRDMA_CQE_LOC_ACCESS_ERR
:
2365 ibwc_status
= IB_WC_LOC_ACCESS_ERR
;
2367 case OCRDMA_CQE_REM_INV_REQ_ERR
:
2368 ibwc_status
= IB_WC_REM_INV_REQ_ERR
;
2370 case OCRDMA_CQE_REM_ACCESS_ERR
:
2371 ibwc_status
= IB_WC_REM_ACCESS_ERR
;
2373 case OCRDMA_CQE_REM_OP_ERR
:
2374 ibwc_status
= IB_WC_REM_OP_ERR
;
2376 case OCRDMA_CQE_RETRY_EXC_ERR
:
2377 ibwc_status
= IB_WC_RETRY_EXC_ERR
;
2379 case OCRDMA_CQE_RNR_RETRY_EXC_ERR
:
2380 ibwc_status
= IB_WC_RNR_RETRY_EXC_ERR
;
2382 case OCRDMA_CQE_LOC_RDD_VIOL_ERR
:
2383 ibwc_status
= IB_WC_LOC_RDD_VIOL_ERR
;
2385 case OCRDMA_CQE_REM_INV_RD_REQ_ERR
:
2386 ibwc_status
= IB_WC_REM_INV_RD_REQ_ERR
;
2388 case OCRDMA_CQE_REM_ABORT_ERR
:
2389 ibwc_status
= IB_WC_REM_ABORT_ERR
;
2391 case OCRDMA_CQE_INV_EECN_ERR
:
2392 ibwc_status
= IB_WC_INV_EECN_ERR
;
2394 case OCRDMA_CQE_INV_EEC_STATE_ERR
:
2395 ibwc_status
= IB_WC_INV_EEC_STATE_ERR
;
2397 case OCRDMA_CQE_FATAL_ERR
:
2398 ibwc_status
= IB_WC_FATAL_ERR
;
2400 case OCRDMA_CQE_RESP_TIMEOUT_ERR
:
2401 ibwc_status
= IB_WC_RESP_TIMEOUT_ERR
;
2404 ibwc_status
= IB_WC_GENERAL_ERR
;
2410 static void ocrdma_update_wc(struct ocrdma_qp
*qp
, struct ib_wc
*ibwc
,
2413 struct ocrdma_hdr_wqe
*hdr
;
2414 struct ocrdma_sge
*rw
;
2417 hdr
= ocrdma_hwq_head_from_idx(&qp
->sq
, wqe_idx
);
2419 ibwc
->wr_id
= qp
->wqe_wr_id_tbl
[wqe_idx
].wrid
;
2420 /* Undo the hdr->cw swap */
2421 opcode
= le32_to_cpu(hdr
->cw
) & OCRDMA_WQE_OPCODE_MASK
;
2424 ibwc
->opcode
= IB_WC_RDMA_WRITE
;
2427 rw
= (struct ocrdma_sge
*)(hdr
+ 1);
2428 ibwc
->opcode
= IB_WC_RDMA_READ
;
2429 ibwc
->byte_len
= rw
->len
;
2432 ibwc
->opcode
= IB_WC_SEND
;
2435 ibwc
->opcode
= IB_WC_REG_MR
;
2437 case OCRDMA_LKEY_INV
:
2438 ibwc
->opcode
= IB_WC_LOCAL_INV
;
2441 ibwc
->status
= IB_WC_GENERAL_ERR
;
2442 pr_err("%s() invalid opcode received = 0x%x\n",
2443 __func__
, hdr
->cw
& OCRDMA_WQE_OPCODE_MASK
);
2448 static void ocrdma_set_cqe_status_flushed(struct ocrdma_qp
*qp
,
2449 struct ocrdma_cqe
*cqe
)
2451 if (is_cqe_for_sq(cqe
)) {
2452 cqe
->flags_status_srcqpn
= cpu_to_le32(le32_to_cpu(
2453 cqe
->flags_status_srcqpn
) &
2454 ~OCRDMA_CQE_STATUS_MASK
);
2455 cqe
->flags_status_srcqpn
= cpu_to_le32(le32_to_cpu(
2456 cqe
->flags_status_srcqpn
) |
2457 (OCRDMA_CQE_WR_FLUSH_ERR
<<
2458 OCRDMA_CQE_STATUS_SHIFT
));
2460 if (qp
->qp_type
== IB_QPT_UD
|| qp
->qp_type
== IB_QPT_GSI
) {
2461 cqe
->flags_status_srcqpn
= cpu_to_le32(le32_to_cpu(
2462 cqe
->flags_status_srcqpn
) &
2463 ~OCRDMA_CQE_UD_STATUS_MASK
);
2464 cqe
->flags_status_srcqpn
= cpu_to_le32(le32_to_cpu(
2465 cqe
->flags_status_srcqpn
) |
2466 (OCRDMA_CQE_WR_FLUSH_ERR
<<
2467 OCRDMA_CQE_UD_STATUS_SHIFT
));
2469 cqe
->flags_status_srcqpn
= cpu_to_le32(le32_to_cpu(
2470 cqe
->flags_status_srcqpn
) &
2471 ~OCRDMA_CQE_STATUS_MASK
);
2472 cqe
->flags_status_srcqpn
= cpu_to_le32(le32_to_cpu(
2473 cqe
->flags_status_srcqpn
) |
2474 (OCRDMA_CQE_WR_FLUSH_ERR
<<
2475 OCRDMA_CQE_STATUS_SHIFT
));
2480 static bool ocrdma_update_err_cqe(struct ib_wc
*ibwc
, struct ocrdma_cqe
*cqe
,
2481 struct ocrdma_qp
*qp
, int status
)
2483 bool expand
= false;
2486 ibwc
->qp
= &qp
->ibqp
;
2487 ibwc
->status
= ocrdma_to_ibwc_err(status
);
2489 ocrdma_flush_qp(qp
);
2490 ocrdma_qp_state_change(qp
, IB_QPS_ERR
, NULL
);
2492 /* if wqe/rqe pending for which cqe needs to be returned,
2493 * trigger inflating it.
2495 if (!is_hw_rq_empty(qp
) || !is_hw_sq_empty(qp
)) {
2497 ocrdma_set_cqe_status_flushed(qp
, cqe
);
2502 static int ocrdma_update_err_rcqe(struct ib_wc
*ibwc
, struct ocrdma_cqe
*cqe
,
2503 struct ocrdma_qp
*qp
, int status
)
2505 ibwc
->opcode
= IB_WC_RECV
;
2506 ibwc
->wr_id
= qp
->rqe_wr_id_tbl
[qp
->rq
.tail
];
2507 ocrdma_hwq_inc_tail(&qp
->rq
);
2509 return ocrdma_update_err_cqe(ibwc
, cqe
, qp
, status
);
2512 static int ocrdma_update_err_scqe(struct ib_wc
*ibwc
, struct ocrdma_cqe
*cqe
,
2513 struct ocrdma_qp
*qp
, int status
)
2515 ocrdma_update_wc(qp
, ibwc
, qp
->sq
.tail
);
2516 ocrdma_hwq_inc_tail(&qp
->sq
);
2518 return ocrdma_update_err_cqe(ibwc
, cqe
, qp
, status
);
2522 static bool ocrdma_poll_err_scqe(struct ocrdma_qp
*qp
,
2523 struct ocrdma_cqe
*cqe
, struct ib_wc
*ibwc
,
2524 bool *polled
, bool *stop
)
2527 struct ocrdma_dev
*dev
= get_ocrdma_dev(qp
->ibqp
.device
);
2528 int status
= (le32_to_cpu(cqe
->flags_status_srcqpn
) &
2529 OCRDMA_CQE_STATUS_MASK
) >> OCRDMA_CQE_STATUS_SHIFT
;
2530 if (status
< OCRDMA_MAX_CQE_ERR
)
2531 atomic_inc(&dev
->cqe_err_stats
[status
]);
2533 /* when hw sq is empty, but rq is not empty, so we continue
2534 * to keep the cqe in order to get the cq event again.
2536 if (is_hw_sq_empty(qp
) && !is_hw_rq_empty(qp
)) {
2537 /* when cq for rq and sq is same, it is safe to return
2538 * flush cqe for RQEs.
2540 if (!qp
->srq
&& (qp
->sq_cq
== qp
->rq_cq
)) {
2542 status
= OCRDMA_CQE_WR_FLUSH_ERR
;
2543 expand
= ocrdma_update_err_rcqe(ibwc
, cqe
, qp
, status
);
2545 /* stop processing further cqe as this cqe is used for
2546 * triggering cq event on buddy cq of RQ.
2547 * When QP is destroyed, this cqe will be removed
2548 * from the cq's hardware q.
2554 } else if (is_hw_sq_empty(qp
)) {
2561 expand
= ocrdma_update_err_scqe(ibwc
, cqe
, qp
, status
);
2566 static bool ocrdma_poll_success_scqe(struct ocrdma_qp
*qp
,
2567 struct ocrdma_cqe
*cqe
,
2568 struct ib_wc
*ibwc
, bool *polled
)
2570 bool expand
= false;
2571 int tail
= qp
->sq
.tail
;
2574 if (!qp
->wqe_wr_id_tbl
[tail
].signaled
) {
2575 *polled
= false; /* WC cannot be consumed yet */
2577 ibwc
->status
= IB_WC_SUCCESS
;
2579 ibwc
->qp
= &qp
->ibqp
;
2580 ocrdma_update_wc(qp
, ibwc
, tail
);
2583 wqe_idx
= (le32_to_cpu(cqe
->wq
.wqeidx
) &
2584 OCRDMA_CQE_WQEIDX_MASK
) & qp
->sq
.max_wqe_idx
;
2585 if (tail
!= wqe_idx
)
2586 expand
= true; /* Coalesced CQE can't be consumed yet */
2588 ocrdma_hwq_inc_tail(&qp
->sq
);
2592 static bool ocrdma_poll_scqe(struct ocrdma_qp
*qp
, struct ocrdma_cqe
*cqe
,
2593 struct ib_wc
*ibwc
, bool *polled
, bool *stop
)
2598 status
= (le32_to_cpu(cqe
->flags_status_srcqpn
) &
2599 OCRDMA_CQE_STATUS_MASK
) >> OCRDMA_CQE_STATUS_SHIFT
;
2601 if (status
== OCRDMA_CQE_SUCCESS
)
2602 expand
= ocrdma_poll_success_scqe(qp
, cqe
, ibwc
, polled
);
2604 expand
= ocrdma_poll_err_scqe(qp
, cqe
, ibwc
, polled
, stop
);
2608 static int ocrdma_update_ud_rcqe(struct ocrdma_dev
*dev
, struct ib_wc
*ibwc
,
2609 struct ocrdma_cqe
*cqe
)
2614 status
= (le32_to_cpu(cqe
->flags_status_srcqpn
) &
2615 OCRDMA_CQE_UD_STATUS_MASK
) >> OCRDMA_CQE_UD_STATUS_SHIFT
;
2616 ibwc
->src_qp
= le32_to_cpu(cqe
->flags_status_srcqpn
) &
2617 OCRDMA_CQE_SRCQP_MASK
;
2618 ibwc
->pkey_index
= 0;
2619 ibwc
->wc_flags
= IB_WC_GRH
;
2620 ibwc
->byte_len
= (le32_to_cpu(cqe
->ud
.rxlen_pkey
) >>
2621 OCRDMA_CQE_UD_XFER_LEN_SHIFT
) &
2622 OCRDMA_CQE_UD_XFER_LEN_MASK
;
2624 if (ocrdma_is_udp_encap_supported(dev
)) {
2625 hdr_type
= (le32_to_cpu(cqe
->ud
.rxlen_pkey
) >>
2626 OCRDMA_CQE_UD_L3TYPE_SHIFT
) &
2627 OCRDMA_CQE_UD_L3TYPE_MASK
;
2628 ibwc
->wc_flags
|= IB_WC_WITH_NETWORK_HDR_TYPE
;
2629 ibwc
->network_hdr_type
= hdr_type
;
2635 static void ocrdma_update_free_srq_cqe(struct ib_wc
*ibwc
,
2636 struct ocrdma_cqe
*cqe
,
2637 struct ocrdma_qp
*qp
)
2639 unsigned long flags
;
2640 struct ocrdma_srq
*srq
;
2643 srq
= get_ocrdma_srq(qp
->ibqp
.srq
);
2644 wqe_idx
= (le32_to_cpu(cqe
->rq
.buftag_qpn
) >>
2645 OCRDMA_CQE_BUFTAG_SHIFT
) & srq
->rq
.max_wqe_idx
;
2646 BUG_ON(wqe_idx
< 1);
2648 ibwc
->wr_id
= srq
->rqe_wr_id_tbl
[wqe_idx
];
2649 spin_lock_irqsave(&srq
->q_lock
, flags
);
2650 ocrdma_srq_toggle_bit(srq
, wqe_idx
- 1);
2651 spin_unlock_irqrestore(&srq
->q_lock
, flags
);
2652 ocrdma_hwq_inc_tail(&srq
->rq
);
2655 static bool ocrdma_poll_err_rcqe(struct ocrdma_qp
*qp
, struct ocrdma_cqe
*cqe
,
2656 struct ib_wc
*ibwc
, bool *polled
, bool *stop
,
2660 struct ocrdma_dev
*dev
= get_ocrdma_dev(qp
->ibqp
.device
);
2662 if (status
< OCRDMA_MAX_CQE_ERR
)
2663 atomic_inc(&dev
->cqe_err_stats
[status
]);
2665 /* when hw_rq is empty, but wq is not empty, so continue
2666 * to keep the cqe to get the cq event again.
2668 if (is_hw_rq_empty(qp
) && !is_hw_sq_empty(qp
)) {
2669 if (!qp
->srq
&& (qp
->sq_cq
== qp
->rq_cq
)) {
2671 status
= OCRDMA_CQE_WR_FLUSH_ERR
;
2672 expand
= ocrdma_update_err_scqe(ibwc
, cqe
, qp
, status
);
2678 } else if (is_hw_rq_empty(qp
)) {
2685 expand
= ocrdma_update_err_rcqe(ibwc
, cqe
, qp
, status
);
2690 static void ocrdma_poll_success_rcqe(struct ocrdma_qp
*qp
,
2691 struct ocrdma_cqe
*cqe
, struct ib_wc
*ibwc
)
2693 struct ocrdma_dev
*dev
;
2695 dev
= get_ocrdma_dev(qp
->ibqp
.device
);
2696 ibwc
->opcode
= IB_WC_RECV
;
2697 ibwc
->qp
= &qp
->ibqp
;
2698 ibwc
->status
= IB_WC_SUCCESS
;
2700 if (qp
->qp_type
== IB_QPT_UD
|| qp
->qp_type
== IB_QPT_GSI
)
2701 ocrdma_update_ud_rcqe(dev
, ibwc
, cqe
);
2703 ibwc
->byte_len
= le32_to_cpu(cqe
->rq
.rxlen
);
2705 if (is_cqe_imm(cqe
)) {
2706 ibwc
->ex
.imm_data
= htonl(le32_to_cpu(cqe
->rq
.lkey_immdt
));
2707 ibwc
->wc_flags
|= IB_WC_WITH_IMM
;
2708 } else if (is_cqe_wr_imm(cqe
)) {
2709 ibwc
->opcode
= IB_WC_RECV_RDMA_WITH_IMM
;
2710 ibwc
->ex
.imm_data
= htonl(le32_to_cpu(cqe
->rq
.lkey_immdt
));
2711 ibwc
->wc_flags
|= IB_WC_WITH_IMM
;
2712 } else if (is_cqe_invalidated(cqe
)) {
2713 ibwc
->ex
.invalidate_rkey
= le32_to_cpu(cqe
->rq
.lkey_immdt
);
2714 ibwc
->wc_flags
|= IB_WC_WITH_INVALIDATE
;
2717 ocrdma_update_free_srq_cqe(ibwc
, cqe
, qp
);
2719 ibwc
->wr_id
= qp
->rqe_wr_id_tbl
[qp
->rq
.tail
];
2720 ocrdma_hwq_inc_tail(&qp
->rq
);
2724 static bool ocrdma_poll_rcqe(struct ocrdma_qp
*qp
, struct ocrdma_cqe
*cqe
,
2725 struct ib_wc
*ibwc
, bool *polled
, bool *stop
)
2728 bool expand
= false;
2731 if (qp
->qp_type
== IB_QPT_UD
|| qp
->qp_type
== IB_QPT_GSI
) {
2732 status
= (le32_to_cpu(cqe
->flags_status_srcqpn
) &
2733 OCRDMA_CQE_UD_STATUS_MASK
) >>
2734 OCRDMA_CQE_UD_STATUS_SHIFT
;
2736 status
= (le32_to_cpu(cqe
->flags_status_srcqpn
) &
2737 OCRDMA_CQE_STATUS_MASK
) >> OCRDMA_CQE_STATUS_SHIFT
;
2740 if (status
== OCRDMA_CQE_SUCCESS
) {
2742 ocrdma_poll_success_rcqe(qp
, cqe
, ibwc
);
2744 expand
= ocrdma_poll_err_rcqe(qp
, cqe
, ibwc
, polled
, stop
,
2750 static void ocrdma_change_cq_phase(struct ocrdma_cq
*cq
, struct ocrdma_cqe
*cqe
,
2753 if (cq
->phase_change
) {
2755 cq
->phase
= (~cq
->phase
& OCRDMA_CQE_VALID
);
2757 /* clear valid bit */
2758 cqe
->flags_status_srcqpn
= 0;
2762 static int ocrdma_poll_hwcq(struct ocrdma_cq
*cq
, int num_entries
,
2767 bool expand
= false;
2768 int polled_hw_cqes
= 0;
2769 struct ocrdma_qp
*qp
= NULL
;
2770 struct ocrdma_dev
*dev
= get_ocrdma_dev(cq
->ibcq
.device
);
2771 struct ocrdma_cqe
*cqe
;
2772 u16 cur_getp
; bool polled
= false; bool stop
= false;
2774 cur_getp
= cq
->getp
;
2775 while (num_entries
) {
2776 cqe
= cq
->va
+ cur_getp
;
2777 /* check whether valid cqe or not */
2778 if (!is_cqe_valid(cq
, cqe
))
2780 qpn
= (le32_to_cpu(cqe
->cmn
.qpn
) & OCRDMA_CQE_QPN_MASK
);
2781 /* ignore discarded cqe */
2784 qp
= dev
->qp_tbl
[qpn
];
2787 if (is_cqe_for_sq(cqe
)) {
2788 expand
= ocrdma_poll_scqe(qp
, cqe
, ibwc
, &polled
,
2791 expand
= ocrdma_poll_rcqe(qp
, cqe
, ibwc
, &polled
,
2798 /* clear qpn to avoid duplicate processing by discard_cqe() */
2801 polled_hw_cqes
+= 1;
2802 cur_getp
= (cur_getp
+ 1) % cq
->max_hw_cqe
;
2803 ocrdma_change_cq_phase(cq
, cqe
, cur_getp
);
2813 cq
->getp
= cur_getp
;
2816 ocrdma_ring_cq_db(dev
, cq
->id
, false, false, polled_hw_cqes
);
2821 /* insert error cqe if the QP's SQ or RQ's CQ matches the CQ under poll. */
2822 static int ocrdma_add_err_cqe(struct ocrdma_cq
*cq
, int num_entries
,
2823 struct ocrdma_qp
*qp
, struct ib_wc
*ibwc
)
2827 while (num_entries
) {
2828 if (is_hw_sq_empty(qp
) && is_hw_rq_empty(qp
))
2830 if (!is_hw_sq_empty(qp
) && qp
->sq_cq
== cq
) {
2831 ocrdma_update_wc(qp
, ibwc
, qp
->sq
.tail
);
2832 ocrdma_hwq_inc_tail(&qp
->sq
);
2833 } else if (!is_hw_rq_empty(qp
) && qp
->rq_cq
== cq
) {
2834 ibwc
->wr_id
= qp
->rqe_wr_id_tbl
[qp
->rq
.tail
];
2835 ocrdma_hwq_inc_tail(&qp
->rq
);
2840 ibwc
->status
= IB_WC_WR_FLUSH_ERR
;
2848 int ocrdma_poll_cq(struct ib_cq
*ibcq
, int num_entries
, struct ib_wc
*wc
)
2850 int cqes_to_poll
= num_entries
;
2851 struct ocrdma_cq
*cq
= get_ocrdma_cq(ibcq
);
2852 struct ocrdma_dev
*dev
= get_ocrdma_dev(ibcq
->device
);
2853 int num_os_cqe
= 0, err_cqes
= 0;
2854 struct ocrdma_qp
*qp
;
2855 unsigned long flags
;
2857 /* poll cqes from adapter CQ */
2858 spin_lock_irqsave(&cq
->cq_lock
, flags
);
2859 num_os_cqe
= ocrdma_poll_hwcq(cq
, cqes_to_poll
, wc
);
2860 spin_unlock_irqrestore(&cq
->cq_lock
, flags
);
2861 cqes_to_poll
-= num_os_cqe
;
2864 wc
= wc
+ num_os_cqe
;
2865 /* adapter returns single error cqe when qp moves to
2866 * error state. So insert error cqes with wc_status as
2867 * FLUSHED for pending WQEs and RQEs of QP's SQ and RQ
2868 * respectively which uses this CQ.
2870 spin_lock_irqsave(&dev
->flush_q_lock
, flags
);
2871 list_for_each_entry(qp
, &cq
->sq_head
, sq_entry
) {
2872 if (cqes_to_poll
== 0)
2874 err_cqes
= ocrdma_add_err_cqe(cq
, cqes_to_poll
, qp
, wc
);
2875 cqes_to_poll
-= err_cqes
;
2876 num_os_cqe
+= err_cqes
;
2879 spin_unlock_irqrestore(&dev
->flush_q_lock
, flags
);
2884 int ocrdma_arm_cq(struct ib_cq
*ibcq
, enum ib_cq_notify_flags cq_flags
)
2886 struct ocrdma_cq
*cq
= get_ocrdma_cq(ibcq
);
2887 struct ocrdma_dev
*dev
= get_ocrdma_dev(ibcq
->device
);
2889 unsigned long flags
;
2890 bool arm_needed
= false, sol_needed
= false;
2894 spin_lock_irqsave(&cq
->cq_lock
, flags
);
2895 if (cq_flags
& IB_CQ_NEXT_COMP
|| cq_flags
& IB_CQ_SOLICITED
)
2897 if (cq_flags
& IB_CQ_SOLICITED
)
2900 ocrdma_ring_cq_db(dev
, cq_id
, arm_needed
, sol_needed
, 0);
2901 spin_unlock_irqrestore(&cq
->cq_lock
, flags
);
2906 struct ib_mr
*ocrdma_alloc_mr(struct ib_pd
*ibpd
, enum ib_mr_type mr_type
,
2910 struct ocrdma_mr
*mr
;
2911 struct ocrdma_pd
*pd
= get_ocrdma_pd(ibpd
);
2912 struct ocrdma_dev
*dev
= get_ocrdma_dev(ibpd
->device
);
2914 if (mr_type
!= IB_MR_TYPE_MEM_REG
)
2915 return ERR_PTR(-EINVAL
);
2917 if (max_num_sg
> dev
->attr
.max_pages_per_frmr
)
2918 return ERR_PTR(-EINVAL
);
2920 mr
= kzalloc(sizeof(*mr
), GFP_KERNEL
);
2922 return ERR_PTR(-ENOMEM
);
2924 mr
->pages
= kcalloc(max_num_sg
, sizeof(u64
), GFP_KERNEL
);
2930 status
= ocrdma_get_pbl_info(dev
, mr
, max_num_sg
);
2934 mr
->hwmr
.remote_rd
= 0;
2935 mr
->hwmr
.remote_wr
= 0;
2936 mr
->hwmr
.local_rd
= 0;
2937 mr
->hwmr
.local_wr
= 0;
2938 mr
->hwmr
.mw_bind
= 0;
2939 status
= ocrdma_build_pbl_tbl(dev
, &mr
->hwmr
);
2942 status
= ocrdma_reg_mr(dev
, &mr
->hwmr
, pd
->id
, 0);
2945 mr
->ibmr
.rkey
= mr
->hwmr
.lkey
;
2946 mr
->ibmr
.lkey
= mr
->hwmr
.lkey
;
2947 dev
->stag_arr
[(mr
->hwmr
.lkey
>> 8) & (OCRDMA_MAX_STAG
- 1)] =
2951 ocrdma_free_mr_pbl_tbl(dev
, &mr
->hwmr
);
2956 return ERR_PTR(-ENOMEM
);
2959 static int ocrdma_set_page(struct ib_mr
*ibmr
, u64 addr
)
2961 struct ocrdma_mr
*mr
= get_ocrdma_mr(ibmr
);
2963 if (unlikely(mr
->npages
== mr
->hwmr
.num_pbes
))
2966 mr
->pages
[mr
->npages
++] = addr
;
2971 int ocrdma_map_mr_sg(struct ib_mr
*ibmr
, struct scatterlist
*sg
, int sg_nents
,
2972 unsigned int *sg_offset
)
2974 struct ocrdma_mr
*mr
= get_ocrdma_mr(ibmr
);
2978 return ib_sg_to_pages(ibmr
, sg
, sg_nents
, sg_offset
, ocrdma_set_page
);