// SPDX-License-Identifier: GPL-2.0-only
/*
 * Copyright (c) 2016 HGST, a Western Digital Company.
 */
#include <linux/moduleparam.h>
#include <linux/slab.h>
#include <linux/pci-p2pdma.h>
#include <rdma/mr_pool.h>
#include <rdma/rw.h>
static bool rdma_rw_force_mr;
module_param_named(force_mr, rdma_rw_force_mr, bool, 0);
MODULE_PARM_DESC(force_mr, "Force usage of MRs for RDMA READ/WRITE operations");
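
/*
 * Usage sketch: with permission 0 the parameter has no sysfs entry, so it can
 * only be set at load time, e.g. "ib_core.force_mr=1" on the kernel command
 * line (assuming this file is linked into ib_core.ko).
 */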

/*
 * Report whether memory registration should be used. Memory registration must
 * be used for iWARP devices because of iWARP-specific limitations. Memory
 * registration is also enabled if registering memory might yield better
 * performance than using multiple SGE entries; see rdma_rw_io_needs_mr().
 */
static inline bool rdma_rw_can_use_mr(struct ib_device *dev, u8 port_num)
{
	if (rdma_protocol_iwarp(dev, port_num))
		return true;
	if (dev->attrs.max_sgl_rd)
		return true;
	if (unlikely(rdma_rw_force_mr))
		return true;
	return false;
}

/*
 * Check if the device will use memory registration for this RW operation.
 * For RDMA READs we must use MRs on iWARP and can optionally use them as an
 * optimization otherwise. Additionally we have a debug option to force usage
 * of MRs to help testing this code path.
 */
static inline bool rdma_rw_io_needs_mr(struct ib_device *dev, u8 port_num,
		enum dma_data_direction dir, int dma_nents)
{
	if (dir == DMA_FROM_DEVICE) {
		if (rdma_protocol_iwarp(dev, port_num))
			return true;
		if (dev->attrs.max_sgl_rd && dma_nents > dev->attrs.max_sgl_rd)
			return true;
	}

	if (unlikely(rdma_rw_force_mr))
		return true;

	return false;
}

static inline u32 rdma_rw_fr_page_list_len(struct ib_device *dev,
					   bool pi_support)
{
	u32 max_pages;

	if (pi_support)
		max_pages = dev->attrs.max_pi_fast_reg_page_list_len;
	else
		max_pages = dev->attrs.max_fast_reg_page_list_len;

	/* arbitrary limit to avoid allocating gigantic resources */
	return min_t(u32, max_pages, 256);
}

static inline int rdma_rw_inv_key(struct rdma_rw_reg_ctx *reg)
{
	int count = 0;

	if (reg->mr->need_inval) {
		reg->inv_wr.opcode = IB_WR_LOCAL_INV;
		reg->inv_wr.ex.invalidate_rkey = reg->mr->lkey;
		reg->inv_wr.next = &reg->reg_wr.wr;
		count++;
	} else {
		reg->inv_wr.next = NULL;
	}

	return count;
}

/* Caller must have zero-initialized *reg. */
static int rdma_rw_init_one_mr(struct ib_qp *qp, u8 port_num,
		struct rdma_rw_reg_ctx *reg, struct scatterlist *sg,
		u32 sg_cnt, u32 offset)
{
	u32 pages_per_mr = rdma_rw_fr_page_list_len(qp->pd->device,
						    qp->integrity_en);
	u32 nents = min(sg_cnt, pages_per_mr);
	int count = 0, ret;

	reg->mr = ib_mr_pool_get(qp, &qp->rdma_mrs);
	if (!reg->mr)
		return -EAGAIN;

	count += rdma_rw_inv_key(reg);

	ret = ib_map_mr_sg(reg->mr, sg, nents, &offset, PAGE_SIZE);
	if (ret < 0 || ret < nents) {
		ib_mr_pool_put(qp, &qp->rdma_mrs, reg->mr);
		return -EINVAL;
	}

	reg->reg_wr.wr.opcode = IB_WR_REG_MR;
	reg->reg_wr.mr = reg->mr;
	reg->reg_wr.access = IB_ACCESS_LOCAL_WRITE;
	if (rdma_protocol_iwarp(qp->device, port_num))
		reg->reg_wr.access |= IB_ACCESS_REMOTE_WRITE;
	count++;

	reg->sge.addr = reg->mr->iova;
	reg->sge.length = reg->mr->length;
	return count;
}

static int rdma_rw_init_mr_wrs(struct rdma_rw_ctx *ctx, struct ib_qp *qp,
		u8 port_num, struct scatterlist *sg, u32 sg_cnt, u32 offset,
		u64 remote_addr, u32 rkey, enum dma_data_direction dir)
{
	struct rdma_rw_reg_ctx *prev = NULL;
	u32 pages_per_mr = rdma_rw_fr_page_list_len(qp->pd->device,
						    qp->integrity_en);
	int i, j, ret = 0, count = 0;

	ctx->nr_ops = (sg_cnt + pages_per_mr - 1) / pages_per_mr;
	ctx->reg = kcalloc(ctx->nr_ops, sizeof(*ctx->reg), GFP_KERNEL);
	if (!ctx->reg) {
		ret = -ENOMEM;
		goto out;
	}

	for (i = 0; i < ctx->nr_ops; i++) {
		struct rdma_rw_reg_ctx *reg = &ctx->reg[i];
		u32 nents = min(sg_cnt, pages_per_mr);

		ret = rdma_rw_init_one_mr(qp, port_num, reg, sg, sg_cnt,
				offset);
		if (ret < 0)
			goto out_free;
		count += ret;

		if (prev) {
			if (reg->mr->need_inval)
				prev->wr.wr.next = &reg->inv_wr;
			else
				prev->wr.wr.next = &reg->reg_wr.wr;
		}

		reg->reg_wr.wr.next = &reg->wr.wr;

		reg->wr.wr.sg_list = &reg->sge;
		reg->wr.wr.num_sge = 1;
		reg->wr.remote_addr = remote_addr;
		reg->wr.rkey = rkey;
		if (dir == DMA_TO_DEVICE) {
			reg->wr.wr.opcode = IB_WR_RDMA_WRITE;
		} else if (!rdma_cap_read_inv(qp->device, port_num)) {
			reg->wr.wr.opcode = IB_WR_RDMA_READ;
		} else {
			reg->wr.wr.opcode = IB_WR_RDMA_READ_WITH_INV;
			reg->wr.wr.ex.invalidate_rkey = reg->mr->lkey;
		}
		count++;

		remote_addr += reg->sge.length;
		sg_cnt -= nents;
		for (j = 0; j < nents; j++)
			sg = sg_next(sg);
		prev = reg;
		offset = 0;
	}

	if (prev)
		prev->wr.wr.next = NULL;

	ctx->type = RDMA_RW_MR;
	return count;

out_free:
	while (--i >= 0)
		ib_mr_pool_put(qp, &qp->rdma_mrs, ctx->reg[i].mr);
	kfree(ctx->reg);
out:
	return ret;
}
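
/*
 * Illustrative sketch of the chain built by rdma_rw_init_mr_wrs() for a
 * two-MR context; the bracketed LOCAL_INV WRs are only linked in when the
 * MR still needs invalidation:
 *
 *	[reg[0].inv_wr] -> reg[0].reg_wr -> reg[0].wr ->
 *	[reg[1].inv_wr] -> reg[1].reg_wr -> reg[1].wr -> NULL
 */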

static int rdma_rw_init_map_wrs(struct rdma_rw_ctx *ctx, struct ib_qp *qp,
		struct scatterlist *sg, u32 sg_cnt, u32 offset,
		u64 remote_addr, u32 rkey, enum dma_data_direction dir)
{
	u32 max_sge = dir == DMA_TO_DEVICE ? qp->max_write_sge :
		      qp->max_read_sge;
	struct ib_sge *sge;
	u32 total_len = 0, i, j;

	ctx->nr_ops = DIV_ROUND_UP(sg_cnt, max_sge);

	ctx->map.sges = sge = kcalloc(sg_cnt, sizeof(*sge), GFP_KERNEL);
	if (!ctx->map.sges)
		goto out;

	ctx->map.wrs = kcalloc(ctx->nr_ops, sizeof(*ctx->map.wrs), GFP_KERNEL);
	if (!ctx->map.wrs)
		goto out_free_sges;

	for (i = 0; i < ctx->nr_ops; i++) {
		struct ib_rdma_wr *rdma_wr = &ctx->map.wrs[i];
		u32 nr_sge = min(sg_cnt, max_sge);

		if (dir == DMA_TO_DEVICE)
			rdma_wr->wr.opcode = IB_WR_RDMA_WRITE;
		else
			rdma_wr->wr.opcode = IB_WR_RDMA_READ;
		rdma_wr->remote_addr = remote_addr + total_len;
		rdma_wr->rkey = rkey;
		rdma_wr->wr.num_sge = nr_sge;
		rdma_wr->wr.sg_list = sge;

		for (j = 0; j < nr_sge; j++, sg = sg_next(sg)) {
			sge->addr = sg_dma_address(sg) + offset;
			sge->length = sg_dma_len(sg) - offset;
			sge->lkey = qp->pd->local_dma_lkey;

			total_len += sge->length;
			sge++;
			sg_cnt--;
			offset = 0;
		}

		rdma_wr->wr.next = i + 1 < ctx->nr_ops ?
			&ctx->map.wrs[i + 1].wr : NULL;
	}

	ctx->type = RDMA_RW_MULTI_WR;
	return ctx->nr_ops;

out_free_sges:
	kfree(ctx->map.sges);
out:
	return -ENOMEM;
}

static int rdma_rw_init_single_wr(struct rdma_rw_ctx *ctx, struct ib_qp *qp,
		struct scatterlist *sg, u32 offset, u64 remote_addr, u32 rkey,
		enum dma_data_direction dir)
{
	struct ib_rdma_wr *rdma_wr = &ctx->single.wr;

	ctx->nr_ops = 1;

	ctx->single.sge.lkey = qp->pd->local_dma_lkey;
	ctx->single.sge.addr = sg_dma_address(sg) + offset;
	ctx->single.sge.length = sg_dma_len(sg) - offset;

	memset(rdma_wr, 0, sizeof(*rdma_wr));
	if (dir == DMA_TO_DEVICE)
		rdma_wr->wr.opcode = IB_WR_RDMA_WRITE;
	else
		rdma_wr->wr.opcode = IB_WR_RDMA_READ;
	rdma_wr->wr.sg_list = &ctx->single.sge;
	rdma_wr->wr.num_sge = 1;
	rdma_wr->remote_addr = remote_addr;
	rdma_wr->rkey = rkey;

	ctx->type = RDMA_RW_SINGLE_WR;
	return 1;
}

/**
 * rdma_rw_ctx_init - initialize a RDMA READ/WRITE context
 * @ctx: context to initialize
 * @qp: queue pair to operate on
 * @port_num: port num to which the connection is bound
 * @sg: scatterlist to READ/WRITE from/to
 * @sg_cnt: number of entries in @sg
 * @sg_offset: current byte offset into @sg
 * @remote_addr: remote address to read/write (relative to @rkey)
 * @rkey: remote key to operate on
 * @dir: %DMA_TO_DEVICE for RDMA WRITE, %DMA_FROM_DEVICE for RDMA READ
 *
 * Returns the number of WQEs that will be needed on the QP's send queue if
 * successful, or a negative error code.
 */
int rdma_rw_ctx_init(struct rdma_rw_ctx *ctx, struct ib_qp *qp, u8 port_num,
		struct scatterlist *sg, u32 sg_cnt, u32 sg_offset,
		u64 remote_addr, u32 rkey, enum dma_data_direction dir)
{
	struct ib_device *dev = qp->pd->device;
	int ret;

	if (is_pci_p2pdma_page(sg_page(sg)))
		ret = pci_p2pdma_map_sg(dev->dma_device, sg, sg_cnt, dir);
	else
		ret = ib_dma_map_sg(dev, sg, sg_cnt, dir);

	if (!ret)
		return -ENOMEM;
	sg_cnt = ret;

	/*
	 * Skip to the S/G entry that sg_offset falls into:
	 */
	for (;;) {
		u32 len = sg_dma_len(sg);

		if (sg_offset < len)
			break;

		sg = sg_next(sg);
		sg_offset -= len;
		sg_cnt--;
	}

	ret = -EIO;
	if (WARN_ON_ONCE(sg_cnt == 0))
		goto out_unmap_sg;

	if (rdma_rw_io_needs_mr(qp->device, port_num, dir, sg_cnt)) {
		ret = rdma_rw_init_mr_wrs(ctx, qp, port_num, sg, sg_cnt,
				sg_offset, remote_addr, rkey, dir);
	} else if (sg_cnt > 1) {
		ret = rdma_rw_init_map_wrs(ctx, qp, sg, sg_cnt, sg_offset,
				remote_addr, rkey, dir);
	} else {
		ret = rdma_rw_init_single_wr(ctx, qp, sg, sg_offset,
				remote_addr, rkey, dir);
	}

	if (ret < 0)
		goto out_unmap_sg;
	return ret;

out_unmap_sg:
	ib_dma_unmap_sg(dev, sg, sg_cnt, dir);
	return ret;
}
EXPORT_SYMBOL(rdma_rw_ctx_init);
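
/*
 * Illustrative caller sketch (the qp, port_num, sgl, sg_cnt, remote_addr,
 * rkey and req->cqe below are hypothetical caller state, e.g. a ULP's
 * connection and request):
 *
 *	struct rdma_rw_ctx ctx;
 *	int ret;
 *
 *	ret = rdma_rw_ctx_init(&ctx, qp, port_num, sgl, sg_cnt, 0,
 *			       remote_addr, rkey, DMA_FROM_DEVICE);
 *	if (ret < 0)
 *		return ret;
 *	ret = rdma_rw_ctx_post(&ctx, qp, port_num, &req->cqe, NULL);
 *
 *	// ...once req->cqe signals completion:
 *	rdma_rw_ctx_destroy(&ctx, qp, port_num, sgl, sg_cnt, DMA_FROM_DEVICE);
 */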

/**
 * rdma_rw_ctx_signature_init - initialize a RW context with signature offload
 * @ctx: context to initialize
 * @qp: queue pair to operate on
 * @port_num: port num to which the connection is bound
 * @sg: scatterlist to READ/WRITE from/to
 * @sg_cnt: number of entries in @sg
 * @prot_sg: scatterlist to READ/WRITE protection information from/to
 * @prot_sg_cnt: number of entries in @prot_sg
 * @sig_attrs: signature offloading algorithms
 * @remote_addr: remote address to read/write (relative to @rkey)
 * @rkey: remote key to operate on
 * @dir: %DMA_TO_DEVICE for RDMA WRITE, %DMA_FROM_DEVICE for RDMA READ
 *
 * Returns the number of WQEs that will be needed on the QP's send queue if
 * successful, or a negative error code.
 */
int rdma_rw_ctx_signature_init(struct rdma_rw_ctx *ctx, struct ib_qp *qp,
		u8 port_num, struct scatterlist *sg, u32 sg_cnt,
		struct scatterlist *prot_sg, u32 prot_sg_cnt,
		struct ib_sig_attrs *sig_attrs,
		u64 remote_addr, u32 rkey, enum dma_data_direction dir)
{
	struct ib_device *dev = qp->pd->device;
	u32 pages_per_mr = rdma_rw_fr_page_list_len(qp->pd->device,
						    qp->integrity_en);
	struct ib_rdma_wr *rdma_wr;
	int count = 0, ret;

	if (sg_cnt > pages_per_mr || prot_sg_cnt > pages_per_mr) {
		pr_err("SG count too large: sg_cnt=%d, prot_sg_cnt=%d, pages_per_mr=%d\n",
		       sg_cnt, prot_sg_cnt, pages_per_mr);
		return -EINVAL;
	}

	ret = ib_dma_map_sg(dev, sg, sg_cnt, dir);
	if (!ret)
		return -ENOMEM;
	sg_cnt = ret;

	if (prot_sg_cnt) {
		ret = ib_dma_map_sg(dev, prot_sg, prot_sg_cnt, dir);
		if (!ret) {
			ret = -ENOMEM;
			goto out_unmap_sg;
		}
		prot_sg_cnt = ret;
	}

	ctx->type = RDMA_RW_SIG_MR;
	ctx->nr_ops = 1;
	ctx->reg = kcalloc(1, sizeof(*ctx->reg), GFP_KERNEL);
	if (!ctx->reg) {
		ret = -ENOMEM;
		goto out_unmap_prot_sg;
	}

	ctx->reg->mr = ib_mr_pool_get(qp, &qp->sig_mrs);
	if (!ctx->reg->mr) {
		ret = -EAGAIN;
		goto out_free_ctx;
	}

	count += rdma_rw_inv_key(ctx->reg);

	memcpy(ctx->reg->mr->sig_attrs, sig_attrs, sizeof(struct ib_sig_attrs));

	ret = ib_map_mr_sg_pi(ctx->reg->mr, sg, sg_cnt, NULL, prot_sg,
			      prot_sg_cnt, NULL, SZ_4K);
	if (unlikely(ret)) {
		pr_err("failed to map PI sg (%d)\n", sg_cnt + prot_sg_cnt);
		goto out_destroy_sig_mr;
	}

	ctx->reg->reg_wr.wr.opcode = IB_WR_REG_MR_INTEGRITY;
	ctx->reg->reg_wr.wr.wr_cqe = NULL;
	ctx->reg->reg_wr.wr.num_sge = 0;
	ctx->reg->reg_wr.wr.send_flags = 0;
	ctx->reg->reg_wr.access = IB_ACCESS_LOCAL_WRITE;
	if (rdma_protocol_iwarp(qp->device, port_num))
		ctx->reg->reg_wr.access |= IB_ACCESS_REMOTE_WRITE;
	ctx->reg->reg_wr.mr = ctx->reg->mr;
	ctx->reg->reg_wr.key = ctx->reg->mr->lkey;
	count++;

	ctx->reg->sge.addr = ctx->reg->mr->iova;
	ctx->reg->sge.length = ctx->reg->mr->length;
	if (sig_attrs->wire.sig_type == IB_SIG_TYPE_NONE)
		ctx->reg->sge.length -= ctx->reg->mr->sig_attrs->meta_length;

	rdma_wr = &ctx->reg->wr;
	rdma_wr->wr.sg_list = &ctx->reg->sge;
	rdma_wr->wr.num_sge = 1;
	rdma_wr->remote_addr = remote_addr;
	rdma_wr->rkey = rkey;
	if (dir == DMA_TO_DEVICE)
		rdma_wr->wr.opcode = IB_WR_RDMA_WRITE;
	else
		rdma_wr->wr.opcode = IB_WR_RDMA_READ;
	ctx->reg->reg_wr.wr.next = &rdma_wr->wr;
	count++;

	return count;

out_destroy_sig_mr:
	ib_mr_pool_put(qp, &qp->sig_mrs, ctx->reg->mr);
out_free_ctx:
	kfree(ctx->reg);
out_unmap_prot_sg:
	if (prot_sg_cnt)
		ib_dma_unmap_sg(dev, prot_sg, prot_sg_cnt, dir);
out_unmap_sg:
	ib_dma_unmap_sg(dev, sg, sg_cnt, dir);
	return ret;
}
EXPORT_SYMBOL(rdma_rw_ctx_signature_init);
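
/*
 * Note: rdma_rw_ctx_signature_init() can only succeed on a QP that was
 * created with IB_QP_CREATE_INTEGRITY_EN, since that is what makes
 * rdma_rw_init_mrs() below populate qp->sig_mrs.
 */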

/*
 * Now that we are going to post the WRs we can update the lkey and need_inval
 * state on the MRs.  If we were doing this at init time, we would get double
 * or missing invalidations if a context was initialized but not actually
 * posted.
 */
static void rdma_rw_update_lkey(struct rdma_rw_reg_ctx *reg, bool need_inval)
{
	reg->mr->need_inval = need_inval;
	ib_update_fast_reg_key(reg->mr, ib_inc_rkey(reg->mr->lkey));
	reg->reg_wr.key = reg->mr->lkey;
	reg->sge.lkey = reg->mr->lkey;
}

/**
 * rdma_rw_ctx_wrs - return chain of WRs for a RDMA READ or WRITE operation
 * @ctx: context to operate on
 * @qp: queue pair to operate on
 * @port_num: port num to which the connection is bound
 * @cqe: completion queue entry for the last WR
 * @chain_wr: WR to append to the posted chain
 *
 * Return the WR chain for the set of RDMA READ/WRITE operations described by
 * @ctx, as well as any memory registration operations needed.  If @chain_wr
 * is non-NULL the WR it points to will be appended to the chain of WRs posted.
 * If @chain_wr is not set @cqe must be set so that the caller gets a
 * completion notification.
 */
struct ib_send_wr *rdma_rw_ctx_wrs(struct rdma_rw_ctx *ctx, struct ib_qp *qp,
		u8 port_num, struct ib_cqe *cqe, struct ib_send_wr *chain_wr)
{
	struct ib_send_wr *first_wr, *last_wr;
	int i;

	switch (ctx->type) {
	case RDMA_RW_SIG_MR:
	case RDMA_RW_MR:
		for (i = 0; i < ctx->nr_ops; i++) {
			rdma_rw_update_lkey(&ctx->reg[i],
				ctx->reg[i].wr.wr.opcode !=
					IB_WR_RDMA_READ_WITH_INV);
		}

		if (ctx->reg[0].inv_wr.next)
			first_wr = &ctx->reg[0].inv_wr;
		else
			first_wr = &ctx->reg[0].reg_wr.wr;
		last_wr = &ctx->reg[ctx->nr_ops - 1].wr.wr;
		break;
	case RDMA_RW_MULTI_WR:
		first_wr = &ctx->map.wrs[0].wr;
		last_wr = &ctx->map.wrs[ctx->nr_ops - 1].wr;
		break;
	case RDMA_RW_SINGLE_WR:
		first_wr = &ctx->single.wr.wr;
		last_wr = &ctx->single.wr.wr;
		break;
	default:
		BUG();
	}

	if (chain_wr) {
		last_wr->next = chain_wr;
	} else {
		last_wr->wr_cqe = cqe;
		last_wr->send_flags |= IB_SEND_SIGNALED;
	}

	return first_wr;
}
EXPORT_SYMBOL(rdma_rw_ctx_wrs);
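
/*
 * Illustrative use of @chain_wr (rsp->send_wr is a hypothetical response WR
 * owned by the caller): a target that wants to post its response together
 * with the RDMA WRITEs can do
 *
 *	first_wr = rdma_rw_ctx_wrs(&ctx, qp, port_num, NULL, &rsp->send_wr);
 *	ib_post_send(qp, first_wr, NULL);
 *
 * in which case the completion is signalled through rsp->send_wr's own
 * wr_cqe rather than @cqe.
 */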

/**
 * rdma_rw_ctx_post - post a RDMA READ or RDMA WRITE operation
 * @ctx: context to operate on
 * @qp: queue pair to operate on
 * @port_num: port num to which the connection is bound
 * @cqe: completion queue entry for the last WR
 * @chain_wr: WR to append to the posted chain
 *
 * Post the set of RDMA READ/WRITE operations described by @ctx, as well as
 * any memory registration operations needed.  If @chain_wr is non-NULL the
 * WR it points to will be appended to the chain of WRs posted.  If @chain_wr
 * is not set @cqe must be set so that the caller gets a completion
 * notification.
 */
int rdma_rw_ctx_post(struct rdma_rw_ctx *ctx, struct ib_qp *qp, u8 port_num,
		struct ib_cqe *cqe, struct ib_send_wr *chain_wr)
{
	struct ib_send_wr *first_wr;

	first_wr = rdma_rw_ctx_wrs(ctx, qp, port_num, cqe, chain_wr);
	return ib_post_send(qp, first_wr, NULL);
}
EXPORT_SYMBOL(rdma_rw_ctx_post);

/**
 * rdma_rw_ctx_destroy - release all resources allocated by rdma_rw_ctx_init
 * @ctx: context to release
 * @qp: queue pair to operate on
 * @port_num: port num to which the connection is bound
 * @sg: scatterlist that was used for the READ/WRITE
 * @sg_cnt: number of entries in @sg
 * @dir: %DMA_TO_DEVICE for RDMA WRITE, %DMA_FROM_DEVICE for RDMA READ
 */
void rdma_rw_ctx_destroy(struct rdma_rw_ctx *ctx, struct ib_qp *qp, u8 port_num,
		struct scatterlist *sg, u32 sg_cnt, enum dma_data_direction dir)
{
	int i;

	switch (ctx->type) {
	case RDMA_RW_MR:
		for (i = 0; i < ctx->nr_ops; i++)
			ib_mr_pool_put(qp, &qp->rdma_mrs, ctx->reg[i].mr);
		kfree(ctx->reg);
		break;
	case RDMA_RW_MULTI_WR:
		kfree(ctx->map.wrs);
		kfree(ctx->map.sges);
		break;
	case RDMA_RW_SINGLE_WR:
		break;
	default:
		BUG();
		break;
	}

	if (is_pci_p2pdma_page(sg_page(sg)))
		pci_p2pdma_unmap_sg(qp->pd->device->dma_device, sg,
				    sg_cnt, dir);
	else
		ib_dma_unmap_sg(qp->pd->device, sg, sg_cnt, dir);
}
EXPORT_SYMBOL(rdma_rw_ctx_destroy);
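
/*
 * Note: the context must only be destroyed once the HCA is done with the
 * buffers, i.e. after the completion for the last WR (or for @chain_wr) has
 * been observed; destroying earlier would unmap memory the device may still
 * access.
 */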

/**
 * rdma_rw_ctx_destroy_signature - release all resources allocated by
 *	rdma_rw_ctx_signature_init
 * @ctx: context to release
 * @qp: queue pair to operate on
 * @port_num: port num to which the connection is bound
 * @sg: scatterlist that was used for the READ/WRITE
 * @sg_cnt: number of entries in @sg
 * @prot_sg: scatterlist that was used for the READ/WRITE of the PI
 * @prot_sg_cnt: number of entries in @prot_sg
 * @dir: %DMA_TO_DEVICE for RDMA WRITE, %DMA_FROM_DEVICE for RDMA READ
 */
void rdma_rw_ctx_destroy_signature(struct rdma_rw_ctx *ctx, struct ib_qp *qp,
		u8 port_num, struct scatterlist *sg, u32 sg_cnt,
		struct scatterlist *prot_sg, u32 prot_sg_cnt,
		enum dma_data_direction dir)
{
	if (WARN_ON_ONCE(ctx->type != RDMA_RW_SIG_MR))
		return;

	ib_mr_pool_put(qp, &qp->sig_mrs, ctx->reg->mr);
	kfree(ctx->reg);

	ib_dma_unmap_sg(qp->pd->device, sg, sg_cnt, dir);
	if (prot_sg_cnt)
		ib_dma_unmap_sg(qp->pd->device, prot_sg, prot_sg_cnt, dir);
}
EXPORT_SYMBOL(rdma_rw_ctx_destroy_signature);

/**
 * rdma_rw_mr_factor - return number of MRs required for a payload
 * @device: device handling the connection
 * @port_num: port num to which the connection is bound
 * @maxpages: maximum payload pages per rdma_rw_ctx
 *
 * Returns the number of MRs the device requires to move @maxpages pages of
 * payload. The returned value is used during transport creation to compute
 * max_rdma_ctxs and the size of the transport's Send and Send Completion
 * Queues.
 */
unsigned int rdma_rw_mr_factor(struct ib_device *device, u8 port_num,
			       unsigned int maxpages)
{
	unsigned int mr_pages;

	if (rdma_rw_can_use_mr(device, port_num))
		mr_pages = rdma_rw_fr_page_list_len(device, false);
	else
		mr_pages = device->attrs.max_sge_rd;
	return DIV_ROUND_UP(maxpages, mr_pages);
}
EXPORT_SYMBOL(rdma_rw_mr_factor);
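
/*
 * Worked example (illustrative): on a device whose fast-reg page list limit
 * is at least 256, rdma_rw_fr_page_list_len() caps mr_pages at 256, so a ULP
 * that wants up to 1024 pages per rdma_rw_ctx gets DIV_ROUND_UP(1024, 256),
 * i.e. 4 MRs per context.
 */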

void rdma_rw_init_qp(struct ib_device *dev, struct ib_qp_init_attr *attr)
{
	u32 factor;

	WARN_ON_ONCE(attr->port_num == 0);

	/*
	 * Each context needs at least one RDMA READ or WRITE WR.
	 *
	 * For some hardware we might need more, eventually we should ask the
	 * HCA driver for a multiplier here.
	 */
	factor = 1;

	/*
	 * If the device needs MRs to perform RDMA READ or WRITE operations,
	 * we'll need two additional WRs per context for the registration and
	 * the invalidation.
	 */
	if (attr->create_flags & IB_QP_CREATE_INTEGRITY_EN ||
	    rdma_rw_can_use_mr(dev, attr->port_num))
		factor += 2;	/* inv + reg */

	attr->cap.max_send_wr += factor * attr->cap.max_rdma_ctxs;

	/*
	 * But maybe we were just too high in the sky and the device doesn't
	 * even support all we need, and we'll have to live with what we get.
	 */
	attr->cap.max_send_wr =
		min_t(u32, attr->cap.max_send_wr, dev->attrs.max_qp_wr);
}
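
/*
 * Worked example (illustrative): for attr->cap.max_rdma_ctxs == 128 on a
 * device where rdma_rw_can_use_mr() is true, factor is 1 + 2 = 3, so
 * max_send_wr is bumped by 384 before being clamped to dev->attrs.max_qp_wr.
 */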

int rdma_rw_init_mrs(struct ib_qp *qp, struct ib_qp_init_attr *attr)
{
	struct ib_device *dev = qp->pd->device;
	u32 nr_mrs = 0, nr_sig_mrs = 0, max_num_sg = 0;
	int ret = 0;

	if (attr->create_flags & IB_QP_CREATE_INTEGRITY_EN) {
		nr_sig_mrs = attr->cap.max_rdma_ctxs;
		nr_mrs = attr->cap.max_rdma_ctxs;
		max_num_sg = rdma_rw_fr_page_list_len(dev, true);
	} else if (rdma_rw_can_use_mr(dev, attr->port_num)) {
		nr_mrs = attr->cap.max_rdma_ctxs;
		max_num_sg = rdma_rw_fr_page_list_len(dev, false);
	}

	if (nr_mrs) {
		ret = ib_mr_pool_init(qp, &qp->rdma_mrs, nr_mrs,
				IB_MR_TYPE_MEM_REG,
				max_num_sg, 0);
		if (ret) {
			pr_err("%s: failed to allocate %d MRs\n",
				__func__, nr_mrs);
			return ret;
		}
	}

	if (nr_sig_mrs) {
		ret = ib_mr_pool_init(qp, &qp->sig_mrs, nr_sig_mrs,
				IB_MR_TYPE_INTEGRITY, max_num_sg, max_num_sg);
		if (ret) {
			pr_err("%s: failed to allocate %d SIG MRs\n",
				__func__, nr_sig_mrs);
			goto out_free_rdma_mrs;
		}
	}

	return 0;

out_free_rdma_mrs:
	ib_mr_pool_destroy(qp, &qp->rdma_mrs);
	return ret;
}

void rdma_rw_cleanup_mrs(struct ib_qp *qp)
{
	ib_mr_pool_destroy(qp, &qp->sig_mrs);
	ib_mr_pool_destroy(qp, &qp->rdma_mrs);
}