 * Copyright(c) 2015, 2016 Intel Corporation.
 *
 * This file is provided under a dual BSD/GPLv2 license.  When using or
 * redistributing this file, you may do so under either license.
 *
 * GPL LICENSE SUMMARY
 *
 * This program is free software; you can redistribute it and/or modify
 * it under the terms of version 2 of the GNU General Public License as
 * published by the Free Software Foundation.
 *
 * This program is distributed in the hope that it will be useful, but
 * WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
 * General Public License for more details.
 *
 * BSD LICENSE
 *
 * Redistribution and use in source and binary forms, with or without
 * modification, are permitted provided that the following conditions
 * are met:
 *
 *  - Redistributions of source code must retain the above copyright
 *    notice, this list of conditions and the following disclaimer.
 *  - Redistributions in binary form must reproduce the above copyright
 *    notice, this list of conditions and the following disclaimer in
 *    the documentation and/or other materials provided with the
 *    distribution.
 *  - Neither the name of Intel Corporation nor the names of its
 *    contributors may be used to endorse or promote products derived
 *    from this software without specific prior written permission.
 *
 * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
 * "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
 * LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
 * A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
 * OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
 * SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
 * LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
 * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
 * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
 * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
 * OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 *
 */
#include <linux/err.h>
#include <linux/vmalloc.h>
#include <linux/hash.h>
#include <linux/module.h>
#include <linux/seq_file.h>
#include <rdma/rdma_vt.h>
#include <rdma/rdmavt_qp.h>
#include <rdma/ib_verbs.h>

#include "hfi.h"
#include "qp.h"
#include "trace.h"
#include "verbs_txreq.h"
unsigned int hfi1_qp_table_size = 256;
module_param_named(qp_table_size, hfi1_qp_table_size, uint, S_IRUGO);
MODULE_PARM_DESC(qp_table_size, "QP table size");
static void flush_tx_list(struct rvt_qp *qp);
static int iowait_sleep(
        struct sdma_engine *sde,
        struct iowait *wait,
        struct sdma_txreq *stx,
        unsigned seq);
static void iowait_wakeup(struct iowait *wait, int reason);
static void iowait_sdma_drained(struct iowait *wait);
static void qp_pio_drain(struct rvt_qp *qp);
static inline unsigned mk_qpn(struct rvt_qpn_table *qpt,
                              struct rvt_qpn_map *map, unsigned off)
{
        return (map - qpt->map) * RVT_BITS_PER_PAGE + off;
}
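
/*
 * Worked example (illustrative only): each rvt_qpn_map page covers
 * RVT_BITS_PER_PAGE QPN bits, so for the third map page (map - qpt->map == 2)
 * and a free bit at offset 5, mk_qpn() returns 2 * RVT_BITS_PER_PAGE + 5.
 * With a 4 KB page backing each map that constant is 32768, giving QPN 65541;
 * the exact value of RVT_BITS_PER_PAGE comes from rdmavt.
 */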
/*
 * Convert the AETH credit code into the number of credits.
 */
static const u16 credit_table[31] = {
        0, 1, 2, 3, 4, 6, 8, 12, 16, 24, 32, 48, 64, 96, 128, 192,
        256, 384, 512, 768, 1024, 1536, 2048, 3072, 4096, 6144, 8192,
        12288, 16384, 24576, 32768
};
const struct rvt_operation_params hfi1_post_parms[RVT_OPERATION_MAX] = {
[IB_WR_RDMA_WRITE] = {
        .length = sizeof(struct ib_rdma_wr),
        .qpt_support = BIT(IB_QPT_UC) | BIT(IB_QPT_RC),
},

[IB_WR_RDMA_READ] = {
        .length = sizeof(struct ib_rdma_wr),
        .qpt_support = BIT(IB_QPT_RC),
        .flags = RVT_OPERATION_ATOMIC,
},

[IB_WR_ATOMIC_CMP_AND_SWP] = {
        .length = sizeof(struct ib_atomic_wr),
        .qpt_support = BIT(IB_QPT_RC),
        .flags = RVT_OPERATION_ATOMIC | RVT_OPERATION_ATOMIC_SGE,
},

[IB_WR_ATOMIC_FETCH_AND_ADD] = {
        .length = sizeof(struct ib_atomic_wr),
        .qpt_support = BIT(IB_QPT_RC),
        .flags = RVT_OPERATION_ATOMIC | RVT_OPERATION_ATOMIC_SGE,
},

[IB_WR_RDMA_WRITE_WITH_IMM] = {
        .length = sizeof(struct ib_rdma_wr),
        .qpt_support = BIT(IB_QPT_UC) | BIT(IB_QPT_RC),
},

[IB_WR_SEND] = {
        .length = sizeof(struct ib_send_wr),
        .qpt_support = BIT(IB_QPT_UD) | BIT(IB_QPT_SMI) | BIT(IB_QPT_GSI) |
                       BIT(IB_QPT_UC) | BIT(IB_QPT_RC),
},

[IB_WR_SEND_WITH_IMM] = {
        .length = sizeof(struct ib_send_wr),
        .qpt_support = BIT(IB_QPT_UD) | BIT(IB_QPT_SMI) | BIT(IB_QPT_GSI) |
                       BIT(IB_QPT_UC) | BIT(IB_QPT_RC),
},

[IB_WR_REG_MR] = {
        .length = sizeof(struct ib_reg_wr),
        .qpt_support = BIT(IB_QPT_UC) | BIT(IB_QPT_RC),
        .flags = RVT_OPERATION_LOCAL,
},

[IB_WR_LOCAL_INV] = {
        .length = sizeof(struct ib_send_wr),
        .qpt_support = BIT(IB_QPT_UC) | BIT(IB_QPT_RC),
        .flags = RVT_OPERATION_LOCAL,
},

[IB_WR_SEND_WITH_INV] = {
        .length = sizeof(struct ib_send_wr),
        .qpt_support = BIT(IB_QPT_RC),
},

};
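
/*
 * Usage sketch (assumption, not code from this file): rdmavt consults this
 * table when a work request is posted, roughly along the lines of
 *
 *      if (!(hfi1_post_parms[wr->opcode].qpt_support &
 *            BIT(qp->ibqp.qp_type)))
 *              return -EINVAL;
 *
 * .qpt_support gates which QP types may post the opcode, .length is the
 * expected size of the work request structure, and .flags marks operations
 * that need atomic or local handling.  The exact check lives in rdmavt's
 * post-send path, not here.
 */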
static void flush_tx_list(struct rvt_qp *qp)
{
        struct hfi1_qp_priv *priv = qp->priv;

        while (!list_empty(&priv->s_iowait.tx_head)) {
                struct sdma_txreq *tx;

                tx = list_first_entry(
                        &priv->s_iowait.tx_head,
                        struct sdma_txreq,
                        list);
                list_del_init(&tx->list);
                hfi1_put_txreq(
                        container_of(tx, struct verbs_txreq, txreq));
        }
}
static void flush_iowait(struct rvt_qp *qp)
{
        struct hfi1_qp_priv *priv = qp->priv;
        struct hfi1_ibdev *dev = to_idev(qp->ibqp.device);
        unsigned long flags;

        write_seqlock_irqsave(&dev->iowait_lock, flags);
        if (!list_empty(&priv->s_iowait.list)) {
                list_del_init(&priv->s_iowait.list);
                if (atomic_dec_and_test(&qp->refcount))
                        wake_up(&qp->wait);
        }
        write_sequnlock_irqrestore(&dev->iowait_lock, flags);
}
static inline int opa_mtu_enum_to_int(int mtu)
{
        switch (mtu) {
        case OPA_MTU_8192:  return 8192;
        case OPA_MTU_10240: return 10240;
        default:            return -1;
        }
}
/*
 * This function is what we would push to the core layer if we wanted to be a
 * "first class citizen".  Instead we hide this here and rely on Verbs ULPs
 * to blindly pass the MTU enum value from the PathRecord to us.
 */
static inline int verbs_mtu_enum_to_int(struct ib_device *dev, enum ib_mtu mtu)
{
        int val;

        /* Constraining 10KB packets to 8KB packets */
        if (mtu == (enum ib_mtu)OPA_MTU_10240)
                mtu = OPA_MTU_8192;
        val = opa_mtu_enum_to_int((int)mtu);
        if (val > 0)
                return val;
        return ib_mtu_enum_to_int(mtu);
}
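
/*
 * Worked example (illustrative): an OPA PathRecord advertising OPA_MTU_10240
 * is clamped above to OPA_MTU_8192, so verbs_mtu_enum_to_int() returns 8192.
 * A standard enum such as IB_MTU_4096 is not an OPA extension, so
 * opa_mtu_enum_to_int() returns -1 and the value falls through to
 * ib_mtu_enum_to_int(), which yields 4096.
 */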
int hfi1_check_modify_qp(struct rvt_qp *qp, struct ib_qp_attr *attr,
                         int attr_mask, struct ib_udata *udata)
{
        struct ib_qp *ibqp = &qp->ibqp;
        struct hfi1_ibdev *dev = to_idev(ibqp->device);
        struct hfi1_devdata *dd = dd_from_dev(dev);
        u8 sc;

        if (attr_mask & IB_QP_AV) {
                sc = ah_to_sc(ibqp->device, &attr->ah_attr);

                if (!qp_to_sdma_engine(qp, sc) &&
                    dd->flags & HFI1_HAS_SEND_DMA)
                        return -EINVAL;

                if (!qp_to_send_context(qp, sc))
                        return -EINVAL;
        }

        if (attr_mask & IB_QP_ALT_PATH) {
                sc = ah_to_sc(ibqp->device, &attr->alt_ah_attr);

                if (!qp_to_sdma_engine(qp, sc) &&
                    dd->flags & HFI1_HAS_SEND_DMA)
                        return -EINVAL;

                if (!qp_to_send_context(qp, sc))
                        return -EINVAL;
        }

        return 0;
}
void hfi1_modify_qp(struct rvt_qp *qp, struct ib_qp_attr *attr,
                    int attr_mask, struct ib_udata *udata)
{
        struct ib_qp *ibqp = &qp->ibqp;
        struct hfi1_qp_priv *priv = qp->priv;

        if (attr_mask & IB_QP_AV) {
                priv->s_sc = ah_to_sc(ibqp->device, &qp->remote_ah_attr);
                priv->s_sde = qp_to_sdma_engine(qp, priv->s_sc);
                priv->s_sendcontext = qp_to_send_context(qp, priv->s_sc);
        }

        if (attr_mask & IB_QP_PATH_MIG_STATE &&
            attr->path_mig_state == IB_MIG_MIGRATED &&
            qp->s_mig_state == IB_MIG_ARMED) {
                qp->s_flags |= RVT_S_AHG_CLEAR;
                priv->s_sc = ah_to_sc(ibqp->device, &qp->remote_ah_attr);
                priv->s_sde = qp_to_sdma_engine(qp, priv->s_sc);
                priv->s_sendcontext = qp_to_send_context(qp, priv->s_sc);
        }
}
/**
 * hfi1_check_send_wqe - validate wqe
 * @qp: the QP
 * @wqe: the built wqe
 *
 * Validate the wqe.  This is called
 * prior to inserting the wqe into
 * the ring, but after the wqe has been
 * set up.
 *
 * Returns 0 on success, -EINVAL on failure
 */
int hfi1_check_send_wqe(struct rvt_qp *qp,
                        struct rvt_swqe *wqe)
{
        struct hfi1_ibport *ibp = to_iport(qp->ibqp.device, qp->port_num);
        struct rvt_ah *ah;

        switch (qp->ibqp.qp_type) {
        case IB_QPT_RC:
        case IB_QPT_UC:
                if (wqe->length > 0x80000000U)
                        return -EINVAL;
                break;
        case IB_QPT_SMI:
                ah = ibah_to_rvtah(wqe->ud_wr.ah);
                if (wqe->length > (1 << ah->log_pmtu))
                        return -EINVAL;
                break;
        case IB_QPT_GSI:
        case IB_QPT_UD:
                ah = ibah_to_rvtah(wqe->ud_wr.ah);
                if (wqe->length > (1 << ah->log_pmtu))
                        return -EINVAL;
                if (ibp->sl_to_sc[ah->attr.sl] == 0xf)
                        return -EINVAL;
                break;
        default:
                break;
        }
        return wqe->length <= piothreshold;
}
/**
 * hfi1_compute_aeth - compute the AETH (syndrome + MSN)
 * @qp: the queue pair to compute the AETH for
 *
 * Returns the AETH.
 */
__be32 hfi1_compute_aeth(struct rvt_qp *qp)
{
        u32 aeth = qp->r_msn & HFI1_MSN_MASK;

        if (qp->ibqp.srq) {
                /*
                 * Shared receive queues don't generate credits.
                 * Set the credit field to the invalid value.
                 */
                aeth |= HFI1_AETH_CREDIT_INVAL << HFI1_AETH_CREDIT_SHIFT;
        } else {
                u32 min, max, x;
                u32 credits;
                struct rvt_rwq *wq = qp->r_rq.wq;
                u32 head;
                u32 tail;

                /* sanity check pointers before trusting them */
                head = wq->head;
                if (head >= qp->r_rq.size)
                        head = 0;
                tail = wq->tail;
                if (tail >= qp->r_rq.size)
                        tail = 0;
                /*
                 * Compute the number of credits available (RWQEs).
                 * There is a small chance that the pair of reads are
                 * not atomic, which is OK, since the fuzziness is
                 * resolved as further ACKs go out.
                 */
                credits = head - tail;
                if ((int)credits < 0)
                        credits += qp->r_rq.size;
                /*
                 * Binary search the credit table to find the code to
                 * use.
                 */
                min = 0;
                max = 31;
                for (;;) {
                        x = (min + max) / 2;
                        if (credit_table[x] == credits)
                                break;
                        if (credit_table[x] > credits) {
                                max = x;
                        } else {
                                if (min == x)
                                        break;
                                min = x;
                        }
                }
                aeth |= x << HFI1_AETH_CREDIT_SHIFT;
        }
        return cpu_to_be32(aeth);
}
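
/*
 * Worked example (illustrative): if the receive queue currently holds 10
 * RWQEs, the binary search settles on the largest credit_table[] entry that
 * does not exceed 10.  Code 0x6 corresponds to 8 credits, so the returned
 * AETH carries 0x6 in the credit field and the MSN
 * (qp->r_msn & HFI1_MSN_MASK) in the remaining low-order bits.
 */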
/**
 * _hfi1_schedule_send - schedule progress
 * @qp: the QP
 *
 * This schedules qp progress w/o regard to the s_flags.
 *
 * It is only used in the post send, which doesn't hold
 * the s_lock.
 */
void _hfi1_schedule_send(struct rvt_qp *qp)
{
        struct hfi1_qp_priv *priv = qp->priv;
        struct hfi1_ibport *ibp =
                to_iport(qp->ibqp.device, qp->port_num);
        struct hfi1_pportdata *ppd = ppd_from_ibp(ibp);
        struct hfi1_devdata *dd = dd_from_ibdev(qp->ibqp.device);

        iowait_schedule(&priv->s_iowait, ppd->hfi1_wq,
                        priv->s_sde ?
                        priv->s_sde->cpu :
                        cpumask_first(cpumask_of_node(dd->node)));
}
static void qp_pio_drain(struct rvt_qp *qp)
{
        struct hfi1_ibdev *dev;
        struct hfi1_qp_priv *priv = qp->priv;

        if (!priv->s_sendcontext)
                return;
        dev = to_idev(qp->ibqp.device);
        while (iowait_pio_pending(&priv->s_iowait)) {
                write_seqlock_irq(&dev->iowait_lock);
                hfi1_sc_wantpiobuf_intr(priv->s_sendcontext, 1);
                write_sequnlock_irq(&dev->iowait_lock);
                iowait_pio_drain(&priv->s_iowait);
                write_seqlock_irq(&dev->iowait_lock);
                hfi1_sc_wantpiobuf_intr(priv->s_sendcontext, 0);
                write_sequnlock_irq(&dev->iowait_lock);
        }
}
/**
 * hfi1_schedule_send - schedule progress
 * @qp: the QP
 *
 * This schedules qp progress and the caller should hold
 * the s_lock.
 */
void hfi1_schedule_send(struct rvt_qp *qp)
{
        if (hfi1_send_ok(qp))
                _hfi1_schedule_send(qp);
}
/**
 * hfi1_get_credit - flush the send work queue of a QP
 * @qp: the qp whose send work queue to flush
 * @aeth: the Acknowledge Extended Transport Header
 *
 * The QP s_lock should be held.
 */
void hfi1_get_credit(struct rvt_qp *qp, u32 aeth)
{
        u32 credit = (aeth >> HFI1_AETH_CREDIT_SHIFT) & HFI1_AETH_CREDIT_MASK;

        /*
         * If the credit is invalid, we can send
         * as many packets as we like.  Otherwise, we have to
         * honor the credit field.
         */
        if (credit == HFI1_AETH_CREDIT_INVAL) {
                if (!(qp->s_flags & RVT_S_UNLIMITED_CREDIT)) {
                        qp->s_flags |= RVT_S_UNLIMITED_CREDIT;
                        if (qp->s_flags & RVT_S_WAIT_SSN_CREDIT) {
                                qp->s_flags &= ~RVT_S_WAIT_SSN_CREDIT;
                                hfi1_schedule_send(qp);
                        }
                }
        } else if (!(qp->s_flags & RVT_S_UNLIMITED_CREDIT)) {
                /* Compute new LSN (i.e., MSN + credit) */
                credit = (aeth + credit_table[credit]) & HFI1_MSN_MASK;
                if (cmp_msn(credit, qp->s_lsn) > 0) {
                        qp->s_lsn = credit;
                        if (qp->s_flags & RVT_S_WAIT_SSN_CREDIT) {
                                qp->s_flags &= ~RVT_S_WAIT_SSN_CREDIT;
                                hfi1_schedule_send(qp);
                        }
                }
        }
}
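
/*
 * Worked example (illustrative): suppose an ACK arrives whose AETH credit
 * field decodes, via credit_table[], to 16 additional RWQEs.  The new limit
 * becomes (aeth + 16) & HFI1_MSN_MASK; if that advances past qp->s_lsn the
 * sender may emit more SSN-credited packets, and a sender blocked on
 * RVT_S_WAIT_SSN_CREDIT is rescheduled.
 */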
void hfi1_qp_wakeup(struct rvt_qp *qp, u32 flag)
{
        unsigned long flags;

        spin_lock_irqsave(&qp->s_lock, flags);
        if (qp->s_flags & flag) {
                qp->s_flags &= ~flag;
                trace_hfi1_qpwakeup(qp, flag);
                hfi1_schedule_send(qp);
        }
        spin_unlock_irqrestore(&qp->s_lock, flags);
        /* Notify hfi1_destroy_qp() if it is waiting. */
        if (atomic_dec_and_test(&qp->refcount))
                wake_up(&qp->wait);
}
static int iowait_sleep(
        struct sdma_engine *sde,
        struct iowait *wait,
        struct sdma_txreq *stx,
        unsigned seq)
{
        struct verbs_txreq *tx = container_of(stx, struct verbs_txreq, txreq);
        struct rvt_qp *qp;
        struct hfi1_qp_priv *priv;
        unsigned long flags;
        int ret = 0;
        struct hfi1_ibdev *dev;

        qp = tx->qp;
        priv = qp->priv;

        spin_lock_irqsave(&qp->s_lock, flags);
        if (ib_rvt_state_ops[qp->state] & RVT_PROCESS_RECV_OK) {
                /*
                 * If we couldn't queue the DMA request, save the info
                 * and try again later rather than destroying the
                 * buffer and undoing the side effects of the copy.
                 */
                /* Make a common routine? */
                dev = &sde->dd->verbs_dev;
                list_add_tail(&stx->list, &wait->tx_head);
                write_seqlock(&dev->iowait_lock);
                if (sdma_progress(sde, seq, stx))
                        goto eagain;
                if (list_empty(&priv->s_iowait.list)) {
                        struct hfi1_ibport *ibp =
                                to_iport(qp->ibqp.device, qp->port_num);

                        ibp->rvp.n_dmawait++;
                        qp->s_flags |= RVT_S_WAIT_DMA_DESC;
                        list_add_tail(&priv->s_iowait.list, &sde->dmawait);
                        trace_hfi1_qpsleep(qp, RVT_S_WAIT_DMA_DESC);
                        atomic_inc(&qp->refcount);
                }
                write_sequnlock(&dev->iowait_lock);
                qp->s_flags &= ~RVT_S_BUSY;
                spin_unlock_irqrestore(&qp->s_lock, flags);
                ret = -EBUSY;
        } else {
                spin_unlock_irqrestore(&qp->s_lock, flags);
                hfi1_put_txreq(tx);
        }
        return ret;
eagain:
        write_sequnlock(&dev->iowait_lock);
        spin_unlock_irqrestore(&qp->s_lock, flags);
        list_del_init(&stx->list);
        return -EAGAIN;
}
static void iowait_wakeup(struct iowait *wait, int reason)
{
        struct rvt_qp *qp = iowait_to_qp(wait);

        WARN_ON(reason != SDMA_AVAIL_REASON);
        hfi1_qp_wakeup(qp, RVT_S_WAIT_DMA_DESC);
}
static void iowait_sdma_drained(struct iowait *wait)
{
        struct rvt_qp *qp = iowait_to_qp(wait);
        unsigned long flags;

        /*
         * This happens when the send engine notes
         * a QP in the error state and cannot
         * do the flush work until that QP's
         * sdma work has finished.
         */
        spin_lock_irqsave(&qp->s_lock, flags);
        if (qp->s_flags & RVT_S_WAIT_DMA) {
                qp->s_flags &= ~RVT_S_WAIT_DMA;
                hfi1_schedule_send(qp);
        }
        spin_unlock_irqrestore(&qp->s_lock, flags);
}
/**
 * qp_to_sdma_engine - map a qp to a send engine
 * @qp: the QP
 * @sc5: the 5 bit sc
 *
 * Return:
 * A send engine for the qp or NULL for SMI type qp.
 */
struct sdma_engine *qp_to_sdma_engine(struct rvt_qp *qp, u8 sc5)
{
        struct hfi1_devdata *dd = dd_from_ibdev(qp->ibqp.device);
        struct sdma_engine *sde;

        if (!(dd->flags & HFI1_HAS_SEND_DMA))
                return NULL;
        switch (qp->ibqp.qp_type) {
        case IB_QPT_SMI:
                return NULL;
        default:
                break;
        }
        sde = sdma_select_engine_sc(dd, qp->ibqp.qp_num >> dd->qos_shift, sc5);
        return sde;
}
/**
 * qp_to_send_context - map a qp to a send context
 * @qp: the QP
 * @sc5: the 5 bit sc
 *
 * Return:
 * A send context for the qp
 */
struct send_context *qp_to_send_context(struct rvt_qp *qp, u8 sc5)
{
        struct hfi1_devdata *dd = dd_from_ibdev(qp->ibqp.device);

        switch (qp->ibqp.qp_type) {
        case IB_QPT_SMI:
                /* SMA packets to VL15 */
                return dd->vld[15].sc;
        default:
                break;
        }

        return pio_select_send_context_sc(dd, qp->ibqp.qp_num >> dd->qos_shift,
                                          sc5);
}
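
/*
 * Illustrative note: both selectors above key off the same pair of inputs,
 * the QPN with the low QoS bits stripped (qp_num >> dd->qos_shift) and the
 * 5-bit SC.  For example, with qos_shift == 1, QPs 0x10 and 0x11 reduce to
 * the same selector value 0x8 and therefore map to the same engine/context
 * for a given SC, keeping a QP's traffic on one send resource.
 */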
struct qp_iter {
        struct hfi1_ibdev *dev;
        struct rvt_qp *qp;
        int specials;
        int n;
};
struct qp_iter *qp_iter_init(struct hfi1_ibdev *dev)
{
        struct qp_iter *iter;

        iter = kzalloc(sizeof(*iter), GFP_KERNEL);
        if (!iter)
                return NULL;

        iter->dev = dev;
        iter->specials = dev->rdi.ibdev.phys_port_cnt * 2;
        if (qp_iter_next(iter)) {
                kfree(iter);
                return NULL;
        }

        return iter;
}
int qp_iter_next(struct qp_iter *iter)
{
        struct hfi1_ibdev *dev = iter->dev;
        int n = iter->n;
        int ret = 1;
        struct rvt_qp *pqp = iter->qp;
        struct rvt_qp *qp;

        /*
         * The approach is to consider the special qps
         * as additional table entries before the
         * real hash table.  Since the qp code sets
         * the qp->next hash link to NULL, this works just fine.
         *
         * iter->specials is 2 * # ports
         *
         * n = 0..iter->specials is the special qp indices
         *
         * n = iter->specials..dev->rdi.qp_dev->qp_table_size+iter->specials are
         * the potential hash bucket entries
         *
         */
        for (; n < dev->rdi.qp_dev->qp_table_size + iter->specials; n++) {
                if (pqp) {
                        qp = rcu_dereference(pqp->next);
                } else {
                        if (n < iter->specials) {
                                struct hfi1_pportdata *ppd;
                                struct hfi1_ibport *ibp;
                                int pidx;

                                pidx = n % dev->rdi.ibdev.phys_port_cnt;
                                ppd = &dd_from_dev(dev)->pport[pidx];
                                ibp = &ppd->ibport_data;

                                if (!(n & 1))
                                        qp = rcu_dereference(ibp->rvp.qp[0]);
                                else
                                        qp = rcu_dereference(ibp->rvp.qp[1]);
                        } else {
                                qp = rcu_dereference(
                                        dev->rdi.qp_dev->qp_table[
                                                (n - iter->specials)]);
                        }
                }
                pqp = qp;
                if (qp) {
                        iter->qp = qp;
                        iter->n = n;
                        return 0;
                }
        }
        return ret;
}
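
/*
 * Worked example (illustrative): with a single physical port,
 * iter->specials is 2, so n == 0 visits the port's QP0 and n == 1 its QP1
 * (qp[n & 1]); from n == 2 onward the loop walks hash bucket
 * n - iter->specials of the real QP table, following each bucket's
 * qp->next chain before advancing to the next bucket.
 */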
static const char * const qp_type_str[] = {
        "SMI", "GSI", "RC", "UC", "UD",
};
static int qp_idle(struct rvt_qp *qp)
{
        return
                qp->s_last == qp->s_acked &&
                qp->s_acked == qp->s_cur &&
                qp->s_cur == qp->s_tail &&
                qp->s_tail == qp->s_head;
}
void qp_iter_print(struct seq_file *s, struct qp_iter *iter)
{
        struct rvt_swqe *wqe;
        struct rvt_qp *qp = iter->qp;
        struct hfi1_qp_priv *priv = qp->priv;
        struct sdma_engine *sde;
        struct send_context *send_context;

        sde = qp_to_sdma_engine(qp, priv->s_sc);
        wqe = rvt_get_swqe_ptr(qp, qp->s_last);
        send_context = qp_to_send_context(qp, priv->s_sc);
        seq_printf(s,
                   "N %d %s QP %x R %u %s %u %u %u f=%x %u %u %u %u %u %u PSN %x %x %x %x %x (%u %u %u %u %u %u %u) RQP %x LID %x SL %u MTU %u %u %u %u SDE %p,%u SC %p,%u SCQ %u %u PID %d\n",
                   iter->n,
                   qp_idle(qp) ? "I" : "B",
                   qp->ibqp.qp_num,
                   atomic_read(&qp->refcount),
                   qp_type_str[qp->ibqp.qp_type],
                   wqe ? wqe->wr.opcode : 0,
                   iowait_sdma_pending(&priv->s_iowait),
                   iowait_pio_pending(&priv->s_iowait),
                   !list_empty(&priv->s_iowait.list),
                   qp->s_psn, qp->s_next_psn,
                   qp->s_sending_psn, qp->s_sending_hpsn,
                   qp->s_last, qp->s_acked, qp->s_cur,
                   qp->s_tail, qp->s_head, qp->s_size,
                   qp->remote_ah_attr.dlid,
                   qp->remote_ah_attr.sl,
                   sde,
                   sde ? sde->this_idx : 0,
                   send_context,
                   send_context ? send_context->sw_index : 0,
                   ibcq_to_rvtcq(qp->ibqp.send_cq)->queue->head,
                   ibcq_to_rvtcq(qp->ibqp.send_cq)->queue->tail,
                   qp->pid);
}
void qp_comm_est(struct rvt_qp *qp)
{
        qp->r_flags |= RVT_R_COMM_EST;
        if (qp->ibqp.event_handler) {
                struct ib_event ev;

                ev.device = qp->ibqp.device;
                ev.element.qp = &qp->ibqp;
                ev.event = IB_EVENT_COMM_EST;
                qp->ibqp.event_handler(&ev, qp->ibqp.qp_context);
        }
}
void *qp_priv_alloc(struct rvt_dev_info *rdi, struct rvt_qp *qp,
                    gfp_t gfp)
{
        struct hfi1_qp_priv *priv;

        priv = kzalloc_node(sizeof(*priv), gfp, rdi->dparms.node);
        if (!priv)
                return ERR_PTR(-ENOMEM);

        priv->s_ahg = kzalloc_node(sizeof(*priv->s_ahg), gfp,
                                   rdi->dparms.node);
        if (!priv->s_ahg) {
                kfree(priv);
                return ERR_PTR(-ENOMEM);
        }
        setup_timer(&priv->s_rnr_timer, hfi1_rc_rnr_retry, (unsigned long)qp);
        qp->s_timer.function = hfi1_rc_timeout;
        return priv;
}
void qp_priv_free(struct rvt_dev_info *rdi, struct rvt_qp *qp)
{
        struct hfi1_qp_priv *priv = qp->priv;

        kfree(priv->s_ahg);
        kfree(priv);
}
unsigned free_all_qps(struct rvt_dev_info *rdi)
{
        struct hfi1_ibdev *verbs_dev = container_of(rdi,
                                                    struct hfi1_ibdev,
                                                    rdi);
        struct hfi1_devdata *dd = container_of(verbs_dev,
                                               struct hfi1_devdata,
                                               verbs_dev);
        int n;
        unsigned qp_inuse = 0;

        for (n = 0; n < dd->num_pports; n++) {
                struct hfi1_ibport *ibp = &dd->pport[n].ibport_data;

                rcu_read_lock();
                if (rcu_dereference(ibp->rvp.qp[0]))
                        qp_inuse++;
                if (rcu_dereference(ibp->rvp.qp[1]))
                        qp_inuse++;
                rcu_read_unlock();
        }

        return qp_inuse;
}
void flush_qp_waiters(struct rvt_qp *qp)
{
        flush_iowait(qp);
        hfi1_stop_rc_timers(qp);
}
void stop_send_queue(struct rvt_qp *qp)
{
        struct hfi1_qp_priv *priv = qp->priv;

        cancel_work_sync(&priv->s_iowait.iowork);
        hfi1_del_timers_sync(qp);
}
void quiesce_qp(struct rvt_qp *qp)
{
        struct hfi1_qp_priv *priv = qp->priv;

        iowait_sdma_drain(&priv->s_iowait);
        qp_pio_drain(qp);
        flush_tx_list(qp);
}
void notify_qp_reset(struct rvt_qp *qp)
{
        struct hfi1_qp_priv *priv = qp->priv;

        iowait_init(&priv->s_iowait,
                    1,
                    _hfi1_do_send,
                    iowait_sleep,
                    iowait_wakeup,
                    iowait_sdma_drained);
        priv->r_adefered = 0;
}
/*
 * Switch to alternate path.
 * The QP s_lock should be held and interrupts disabled.
 */
void hfi1_migrate_qp(struct rvt_qp *qp)
{
        struct hfi1_qp_priv *priv = qp->priv;
        struct ib_event ev;

        qp->s_mig_state = IB_MIG_MIGRATED;
        qp->remote_ah_attr = qp->alt_ah_attr;
        qp->port_num = qp->alt_ah_attr.port_num;
        qp->s_pkey_index = qp->s_alt_pkey_index;
        qp->s_flags |= RVT_S_AHG_CLEAR;
        priv->s_sc = ah_to_sc(qp->ibqp.device, &qp->remote_ah_attr);
        priv->s_sde = qp_to_sdma_engine(qp, priv->s_sc);

        ev.device = qp->ibqp.device;
        ev.element.qp = &qp->ibqp;
        ev.event = IB_EVENT_PATH_MIG;
        qp->ibqp.event_handler(&ev, qp->ibqp.qp_context);
}
int mtu_to_path_mtu(u32 mtu)
{
        return mtu_to_enum(mtu, OPA_MTU_8192);
}
u32 mtu_from_qp(struct rvt_dev_info *rdi, struct rvt_qp *qp, u32 pmtu)
{
        struct hfi1_ibdev *verbs_dev = container_of(rdi,
                                                    struct hfi1_ibdev,
                                                    rdi);
        struct hfi1_devdata *dd = container_of(verbs_dev,
                                               struct hfi1_devdata,
                                               verbs_dev);
        struct hfi1_ibport *ibp;
        u8 sc, vl;
        u32 mtu;

        ibp = &dd->pport[qp->port_num - 1].ibport_data;
        sc = ibp->sl_to_sc[qp->remote_ah_attr.sl];
        vl = sc_to_vlt(dd, sc);

        mtu = verbs_mtu_enum_to_int(qp->ibqp.device, pmtu);
        if (vl < PER_VL_SEND_CONTEXTS)
                mtu = min_t(u32, mtu, dd->vld[vl].mtu);
        return mtu;
}
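
/*
 * Worked example (illustrative): if the negotiated path MTU enum decodes to
 * 8192 bytes but the VL that this QP's SL maps to is configured with a
 * 4096-byte MTU in dd->vld[], the QP ends up using 4096; the path MTU is
 * always clamped to what the chosen VL can actually carry.
 */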
int get_pmtu_from_attr(struct rvt_dev_info *rdi, struct rvt_qp *qp,
                       struct ib_qp_attr *attr)
{
        int mtu, pidx = qp->port_num - 1;
        struct hfi1_ibdev *verbs_dev = container_of(rdi,
                                                    struct hfi1_ibdev,
                                                    rdi);
        struct hfi1_devdata *dd = container_of(verbs_dev,
                                               struct hfi1_devdata,
                                               verbs_dev);
        mtu = verbs_mtu_enum_to_int(qp->ibqp.device, attr->path_mtu);
        if (mtu == -1)
                return -1; /* values less than 0 are error */

        if (mtu > dd->pport[pidx].ibmtu)
                return mtu_to_enum(dd->pport[pidx].ibmtu, IB_MTU_2048);
        else
                return attr->path_mtu;
}
void notify_error_qp(struct rvt_qp *qp)
{
        struct hfi1_ibdev *dev = to_idev(qp->ibqp.device);
        struct hfi1_qp_priv *priv = qp->priv;

        write_seqlock(&dev->iowait_lock);
        if (!list_empty(&priv->s_iowait.list) && !(qp->s_flags & RVT_S_BUSY)) {
                qp->s_flags &= ~RVT_S_ANY_WAIT_IO;
                list_del_init(&priv->s_iowait.list);
                if (atomic_dec_and_test(&qp->refcount))
                        wake_up(&qp->wait);
        }
        write_sequnlock(&dev->iowait_lock);

        if (!(qp->s_flags & RVT_S_BUSY)) {
                if (qp->s_rdma_mr) {
                        rvt_put_mr(qp->s_rdma_mr);
                        qp->s_rdma_mr = NULL;
                }
        }
}
/**
 * hfi1_error_port_qps - put a port's RC/UC qps into error state
 * @ibp: the ibport.
 * @sl: the service level.
 *
 * This function places all RC/UC qps with a given service level into error
 * state. It is generally called to force upper layer apps to abandon stale
 * qps after an sl->sc mapping change.
 */
void hfi1_error_port_qps(struct hfi1_ibport *ibp, u8 sl)
{
        struct rvt_qp *qp = NULL;
        struct hfi1_pportdata *ppd = ppd_from_ibp(ibp);
        struct hfi1_ibdev *dev = &ppd->dd->verbs_dev;
        int n;
        int lastwqe;
        struct ib_event ev;

        rcu_read_lock();

        /* Deal only with RC/UC qps that use the given SL. */
        for (n = 0; n < dev->rdi.qp_dev->qp_table_size; n++) {
                for (qp = rcu_dereference(dev->rdi.qp_dev->qp_table[n]); qp;
                        qp = rcu_dereference(qp->next)) {
                        if (qp->port_num == ppd->port &&
                            (qp->ibqp.qp_type == IB_QPT_UC ||
                             qp->ibqp.qp_type == IB_QPT_RC) &&
                            qp->remote_ah_attr.sl == sl &&
                            (ib_rvt_state_ops[qp->state] &
                             RVT_POST_SEND_OK)) {
                                spin_lock_irq(&qp->r_lock);
                                spin_lock(&qp->s_hlock);
                                spin_lock(&qp->s_lock);
                                lastwqe = rvt_error_qp(qp,
                                                       IB_WC_WR_FLUSH_ERR);
                                spin_unlock(&qp->s_lock);
                                spin_unlock(&qp->s_hlock);
                                spin_unlock_irq(&qp->r_lock);
                                if (lastwqe) {
                                        ev.device = qp->ibqp.device;
                                        ev.element.qp = &qp->ibqp;
                                        ev.event =
                                                IB_EVENT_QP_LAST_WQE_REACHED;
                                        qp->ibqp.event_handler(&ev,
                                                qp->ibqp.qp_context);