/*
 * Copyright (c) 2004 Topspin Communications.  All rights reserved.
 * Copyright (c) 2005, 2006, 2007 Cisco Systems, Inc.  All rights reserved.
 * Copyright (c) 2005, 2006, 2007, 2008 Mellanox Technologies. All rights reserved.
 * Copyright (c) 2004 Voltaire, Inc. All rights reserved.
 *
 * This software is available to you under a choice of one of two
 * licenses.  You may choose to be licensed under the terms of the GNU
 * General Public License (GPL) Version 2, available from the file
 * COPYING in the main directory of this source tree, or the
 * OpenIB.org BSD license below:
 *
 *     Redistribution and use in source and binary forms, with or
 *     without modification, are permitted provided that the following
 *     conditions are met:
 *
 *      - Redistributions of source code must retain the above
 *        copyright notice, this list of conditions and the following
 *        disclaimer.
 *
 *      - Redistributions in binary form must reproduce the above
 *        copyright notice, this list of conditions and the following
 *        disclaimer in the documentation and/or other materials
 *        provided with the distribution.
 *
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
 * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
 * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
 * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS
 * BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN
 * ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN
 * CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
 * SOFTWARE.
 */
#include <linux/gfp.h>
#include <linux/export.h>

#include <linux/mlx4/cmd.h>
#include <linux/mlx4/qp.h>

#include "mlx4.h"
#include "icm.h"
/* QP to support BF should have bits 6,7 cleared */
#define MLX4_BF_QP_SKIP_MASK	0xc0
#define MLX4_MAX_BF_QP_RANGE	0x40
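/*
 * Note: 0xc0 is bits 6 and 7, so a BlueFlame-capable QP must satisfy
 * (qpn & MLX4_BF_QP_SKIP_MASK) == 0.  MLX4_MAX_BF_QP_RANGE (0x40 == 64) is
 * the largest contiguous range in which every QP number can still have both
 * of those bits clear.
 */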
void mlx4_qp_event(struct mlx4_dev *dev, u32 qpn, int event_type)
{
	struct mlx4_qp_table *qp_table = &mlx4_priv(dev)->qp_table;
	struct mlx4_qp *qp;

	spin_lock(&qp_table->lock);

	qp = __mlx4_qp_lookup(dev, qpn);
	if (qp)
		atomic_inc(&qp->refcount);

	spin_unlock(&qp_table->lock);

	if (!qp) {
		mlx4_dbg(dev, "Async event for nonexistent QP %08x\n", qpn);
		return;
	}

	qp->event(qp, event_type);

	if (atomic_dec_and_test(&qp->refcount))
		complete(&qp->free);
}
/* used for INIT/CLOSE port logic */
static int is_master_qp0(struct mlx4_dev *dev, struct mlx4_qp *qp, int *real_qp0, int *proxy_qp0)
{
	/* this procedure is called after we already know we are on the master */
	/* qp0 is either the proxy qp0, or the real qp0 */
	u32 pf_proxy_offset = dev->phys_caps.base_proxy_sqpn + 8 * mlx4_master_func_num(dev);
	*proxy_qp0 = qp->qpn >= pf_proxy_offset && qp->qpn <= pf_proxy_offset + 1;

	*real_qp0 = qp->qpn >= dev->phys_caps.base_sqpn &&
		qp->qpn <= dev->phys_caps.base_sqpn + 1;

	return *real_qp0 || *proxy_qp0;
}
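/*
 * op[cur_state][new_state] below maps a (current, next) QP state pair to the
 * firmware command that performs that transition; for example,
 * op[MLX4_QP_STATE_RTR][MLX4_QP_STATE_RTS] is MLX4_CMD_RTR2RTS_QP.  A zero
 * entry means the transition is not supported, and __mlx4_qp_modify()
 * rejects it with -EINVAL.
 */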
static int __mlx4_qp_modify(struct mlx4_dev *dev, struct mlx4_mtt *mtt,
		     enum mlx4_qp_state cur_state, enum mlx4_qp_state new_state,
		     struct mlx4_qp_context *context,
		     enum mlx4_qp_optpar optpar,
		     int sqd_event, struct mlx4_qp *qp, int native)
{
	static const u16 op[MLX4_QP_NUM_STATE][MLX4_QP_NUM_STATE] = {
		[MLX4_QP_STATE_RST] = {
			[MLX4_QP_STATE_RST]	= MLX4_CMD_2RST_QP,
			[MLX4_QP_STATE_ERR]	= MLX4_CMD_2ERR_QP,
			[MLX4_QP_STATE_INIT]	= MLX4_CMD_RST2INIT_QP,
		},
		[MLX4_QP_STATE_INIT]  = {
			[MLX4_QP_STATE_RST]	= MLX4_CMD_2RST_QP,
			[MLX4_QP_STATE_ERR]	= MLX4_CMD_2ERR_QP,
			[MLX4_QP_STATE_INIT]	= MLX4_CMD_INIT2INIT_QP,
			[MLX4_QP_STATE_RTR]	= MLX4_CMD_INIT2RTR_QP,
		},
		[MLX4_QP_STATE_RTR]   = {
			[MLX4_QP_STATE_RST]	= MLX4_CMD_2RST_QP,
			[MLX4_QP_STATE_ERR]	= MLX4_CMD_2ERR_QP,
			[MLX4_QP_STATE_RTS]	= MLX4_CMD_RTR2RTS_QP,
		},
		[MLX4_QP_STATE_RTS]   = {
			[MLX4_QP_STATE_RST]	= MLX4_CMD_2RST_QP,
			[MLX4_QP_STATE_ERR]	= MLX4_CMD_2ERR_QP,
			[MLX4_QP_STATE_RTS]	= MLX4_CMD_RTS2RTS_QP,
			[MLX4_QP_STATE_SQD]	= MLX4_CMD_RTS2SQD_QP,
		},
		[MLX4_QP_STATE_SQD] = {
			[MLX4_QP_STATE_RST]	= MLX4_CMD_2RST_QP,
			[MLX4_QP_STATE_ERR]	= MLX4_CMD_2ERR_QP,
			[MLX4_QP_STATE_RTS]	= MLX4_CMD_SQD2RTS_QP,
			[MLX4_QP_STATE_SQD]	= MLX4_CMD_SQD2SQD_QP,
		},
		[MLX4_QP_STATE_SQER] = {
			[MLX4_QP_STATE_RST]	= MLX4_CMD_2RST_QP,
			[MLX4_QP_STATE_ERR]	= MLX4_CMD_2ERR_QP,
			[MLX4_QP_STATE_RTS]	= MLX4_CMD_SQERR2RTS_QP,
		},
		[MLX4_QP_STATE_ERR] = {
			[MLX4_QP_STATE_RST]	= MLX4_CMD_2RST_QP,
			[MLX4_QP_STATE_ERR]	= MLX4_CMD_2ERR_QP,
		}
	};

	struct mlx4_priv *priv = mlx4_priv(dev);
	struct mlx4_cmd_mailbox *mailbox;
	int ret = 0;
	int real_qp0 = 0;
	int proxy_qp0 = 0;
	u8 port;

	if (cur_state >= MLX4_QP_NUM_STATE || new_state >= MLX4_QP_NUM_STATE ||
	    !op[cur_state][new_state])
		return -EINVAL;

	if (op[cur_state][new_state] == MLX4_CMD_2RST_QP) {
		ret = mlx4_cmd(dev, 0, qp->qpn, 2,
			MLX4_CMD_2RST_QP, MLX4_CMD_TIME_CLASS_A, native);
		if (mlx4_is_master(dev) && cur_state != MLX4_QP_STATE_ERR &&
		    cur_state != MLX4_QP_STATE_RST &&
		    is_master_qp0(dev, qp, &real_qp0, &proxy_qp0)) {
			port = (qp->qpn & 1) + 1;
			if (proxy_qp0)
				priv->mfunc.master.qp0_state[port].proxy_qp0_active = 0;
			else
				priv->mfunc.master.qp0_state[port].qp0_active = 0;
		}
		return ret;
	}

	mailbox = mlx4_alloc_cmd_mailbox(dev);
	if (IS_ERR(mailbox))
		return PTR_ERR(mailbox);

	if (cur_state == MLX4_QP_STATE_RST && new_state == MLX4_QP_STATE_INIT) {
		u64 mtt_addr = mlx4_mtt_addr(dev, mtt);
		context->mtt_base_addr_h = mtt_addr >> 32;
		context->mtt_base_addr_l = cpu_to_be32(mtt_addr & 0xffffffff);
		context->log_page_size   = mtt->page_shift - MLX4_ICM_PAGE_SHIFT;
	}

	if ((cur_state == MLX4_QP_STATE_RTR) &&
	    (new_state == MLX4_QP_STATE_RTS) &&
	    dev->caps.flags2 & MLX4_DEV_CAP_FLAG2_ROCE_V1_V2)
		context->roce_entropy =
			cpu_to_be16(mlx4_qp_roce_entropy(dev, qp->qpn));

	*(__be32 *) mailbox->buf = cpu_to_be32(optpar);
	memcpy(mailbox->buf + 8, context, sizeof *context);

	((struct mlx4_qp_context *) (mailbox->buf + 8))->local_qpn =
		cpu_to_be32(qp->qpn);

	ret = mlx4_cmd(dev, mailbox->dma,
		       qp->qpn | (!!sqd_event << 31),
		       new_state == MLX4_QP_STATE_RST ? 2 : 0,
		       op[cur_state][new_state], MLX4_CMD_TIME_CLASS_C, native);

	if (mlx4_is_master(dev) && is_master_qp0(dev, qp, &real_qp0, &proxy_qp0)) {
		port = (qp->qpn & 1) + 1;
		if (cur_state != MLX4_QP_STATE_ERR &&
		    cur_state != MLX4_QP_STATE_RST &&
		    new_state == MLX4_QP_STATE_ERR) {
			if (proxy_qp0)
				priv->mfunc.master.qp0_state[port].proxy_qp0_active = 0;
			else
				priv->mfunc.master.qp0_state[port].qp0_active = 0;
		} else if (new_state == MLX4_QP_STATE_RTR) {
			if (proxy_qp0)
				priv->mfunc.master.qp0_state[port].proxy_qp0_active = 1;
			else
				priv->mfunc.master.qp0_state[port].qp0_active = 1;
		}
	}

	mlx4_free_cmd_mailbox(dev, mailbox);
	return ret;
}
int mlx4_qp_modify(struct mlx4_dev *dev, struct mlx4_mtt *mtt,
		   enum mlx4_qp_state cur_state, enum mlx4_qp_state new_state,
		   struct mlx4_qp_context *context,
		   enum mlx4_qp_optpar optpar,
		   int sqd_event, struct mlx4_qp *qp)
{
	return __mlx4_qp_modify(dev, mtt, cur_state, new_state, context,
				optpar, sqd_event, qp, 0);
}
EXPORT_SYMBOL_GPL(mlx4_qp_modify);
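/*
 * Callers normally walk a QP through the firmware states one hop at a time
 * (RST -> INIT -> RTR -> RTS); mlx4_qp_to_ready() further down in this file
 * wraps that sequence for the common bring-up case.
 */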
int __mlx4_qp_reserve_range(struct mlx4_dev *dev, int cnt, int align,
			    int *base, u8 flags)
{
	u32 uid;
	int bf_qp = !!(flags & (u8)MLX4_RESERVE_ETH_BF_QP);

	struct mlx4_priv *priv = mlx4_priv(dev);
	struct mlx4_qp_table *qp_table = &priv->qp_table;

	if (cnt > MLX4_MAX_BF_QP_RANGE && bf_qp)
		return -ENOMEM;

	uid = MLX4_QP_TABLE_ZONE_GENERAL;
	if (flags & (u8)MLX4_RESERVE_A0_QP) {
		if (bf_qp)
			uid = MLX4_QP_TABLE_ZONE_RAW_ETH;
		else
			uid = MLX4_QP_TABLE_ZONE_RSS;
	}

	*base = mlx4_zone_alloc_entries(qp_table->zones, uid, cnt, align,
					bf_qp ? MLX4_BF_QP_SKIP_MASK : 0, NULL);
	if (*base == -1)
		return -ENOMEM;

	return 0;
}
int mlx4_qp_reserve_range(struct mlx4_dev *dev, int cnt, int align,
			  int *base, u8 flags)
{
	u64 in_param = 0;
	u64 out_param;
	int err;

	/* Turn off all unsupported QP allocation flags */
	flags &= dev->caps.alloc_res_qp_mask;

	if (mlx4_is_mfunc(dev)) {
		set_param_l(&in_param, (((u32)flags) << 24) | (u32)cnt);
		set_param_h(&in_param, align);
		err = mlx4_cmd_imm(dev, in_param, &out_param,
				   RES_QP, RES_OP_RESERVE,
				   MLX4_CMD_ALLOC_RES,
				   MLX4_CMD_TIME_CLASS_A, MLX4_CMD_WRAPPED);
		if (err)
			return err;

		*base = get_param_l(&out_param);
		return 0;
	}
	return __mlx4_qp_reserve_range(dev, cnt, align, base, flags);
}
EXPORT_SYMBOL_GPL(mlx4_qp_reserve_range);
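/*
 * Illustrative sketch (not taken from this driver): a consumer reserves an
 * aligned block of QP numbers, allocates one of them, and releases the block
 * when done.  Error handling is omitted.
 *
 *	int base;
 *
 *	if (!mlx4_qp_reserve_range(dev, 8, 8, &base, 0)) {
 *		struct mlx4_qp qp;
 *
 *		if (!mlx4_qp_alloc(dev, base, &qp, GFP_KERNEL)) {
 *			... use the QP ...
 *			mlx4_qp_remove(dev, &qp);
 *			mlx4_qp_free(dev, &qp);
 *		}
 *		mlx4_qp_release_range(dev, base, 8);
 *	}
 */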
void __mlx4_qp_release_range(struct mlx4_dev *dev, int base_qpn, int cnt)
{
	struct mlx4_priv *priv = mlx4_priv(dev);
	struct mlx4_qp_table *qp_table = &priv->qp_table;

	if (mlx4_is_qp_reserved(dev, (u32) base_qpn))
		return;
	mlx4_zone_free_entries_unique(qp_table->zones, base_qpn, cnt);
}
void mlx4_qp_release_range(struct mlx4_dev *dev, int base_qpn, int cnt)
{
	u64 in_param = 0;
	int err;

	if (mlx4_is_mfunc(dev)) {
		set_param_l(&in_param, base_qpn);
		set_param_h(&in_param, cnt);
		err = mlx4_cmd(dev, in_param, RES_QP, RES_OP_RESERVE,
			       MLX4_CMD_FREE_RES,
			       MLX4_CMD_TIME_CLASS_A, MLX4_CMD_WRAPPED);
		if (err) {
			mlx4_warn(dev, "Failed to release qp range base:%d cnt:%d\n",
				  base_qpn, cnt);
		}
	} else
		__mlx4_qp_release_range(dev, base_qpn, cnt);
}
EXPORT_SYMBOL_GPL(mlx4_qp_release_range);
int __mlx4_qp_alloc_icm(struct mlx4_dev *dev, int qpn, gfp_t gfp)
{
	struct mlx4_priv *priv = mlx4_priv(dev);
	struct mlx4_qp_table *qp_table = &priv->qp_table;
	int err;

	err = mlx4_table_get(dev, &qp_table->qp_table, qpn, gfp);
	if (err)
		goto err_out;

	err = mlx4_table_get(dev, &qp_table->auxc_table, qpn, gfp);
	if (err)
		goto err_put_qp;

	err = mlx4_table_get(dev, &qp_table->altc_table, qpn, gfp);
	if (err)
		goto err_put_auxc;

	err = mlx4_table_get(dev, &qp_table->rdmarc_table, qpn, gfp);
	if (err)
		goto err_put_altc;

	err = mlx4_table_get(dev, &qp_table->cmpt_table, qpn, gfp);
	if (err)
		goto err_put_rdmarc;

	return 0;

err_put_rdmarc:
	mlx4_table_put(dev, &qp_table->rdmarc_table, qpn);

err_put_altc:
	mlx4_table_put(dev, &qp_table->altc_table, qpn);

err_put_auxc:
	mlx4_table_put(dev, &qp_table->auxc_table, qpn);

err_put_qp:
	mlx4_table_put(dev, &qp_table->qp_table, qpn);

err_out:
	return err;
}
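/*
 * The mlx4_qp_{alloc,free}_icm() wrappers below are multi-function aware:
 * on an SR-IOV device they do not touch the ICM tables directly but issue
 * RES_QP/RES_OP_MAP_ICM allocate/free commands, which the resource tracker
 * on the PF is expected to translate into the __mlx4_qp_{alloc,free}_icm()
 * helpers above.
 */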
static int mlx4_qp_alloc_icm(struct mlx4_dev *dev, int qpn, gfp_t gfp)
{
	u64 param = 0;

	if (mlx4_is_mfunc(dev)) {
		set_param_l(&param, qpn);
		return mlx4_cmd_imm(dev, param, &param, RES_QP, RES_OP_MAP_ICM,
				    MLX4_CMD_ALLOC_RES, MLX4_CMD_TIME_CLASS_A,
				    MLX4_CMD_WRAPPED);
	}
	return __mlx4_qp_alloc_icm(dev, qpn, gfp);
}
void __mlx4_qp_free_icm(struct mlx4_dev *dev, int qpn)
{
	struct mlx4_priv *priv = mlx4_priv(dev);
	struct mlx4_qp_table *qp_table = &priv->qp_table;

	mlx4_table_put(dev, &qp_table->cmpt_table, qpn);
	mlx4_table_put(dev, &qp_table->rdmarc_table, qpn);
	mlx4_table_put(dev, &qp_table->altc_table, qpn);
	mlx4_table_put(dev, &qp_table->auxc_table, qpn);
	mlx4_table_put(dev, &qp_table->qp_table, qpn);
}
static void mlx4_qp_free_icm(struct mlx4_dev *dev, int qpn)
{
	u64 in_param = 0;

	if (mlx4_is_mfunc(dev)) {
		set_param_l(&in_param, qpn);
		if (mlx4_cmd(dev, in_param, RES_QP, RES_OP_MAP_ICM,
			     MLX4_CMD_FREE_RES, MLX4_CMD_TIME_CLASS_A,
			     MLX4_CMD_WRAPPED))
			mlx4_warn(dev, "Failed to free icm of qp:%d\n", qpn);
	} else
		__mlx4_qp_free_icm(dev, qpn);
}
int mlx4_qp_alloc(struct mlx4_dev *dev, int qpn, struct mlx4_qp *qp, gfp_t gfp)
{
	struct mlx4_priv *priv = mlx4_priv(dev);
	struct mlx4_qp_table *qp_table = &priv->qp_table;
	int err;

	if (!qpn)
		return -EINVAL;

	qp->qpn = qpn;

	err = mlx4_qp_alloc_icm(dev, qpn, gfp);
	if (err)
		return err;

	spin_lock_irq(&qp_table->lock);
	err = radix_tree_insert(&dev->qp_table_tree, qp->qpn &
				(dev->caps.num_qps - 1), qp);
	spin_unlock_irq(&qp_table->lock);
	if (err)
		goto err_icm;

	atomic_set(&qp->refcount, 1);
	init_completion(&qp->free);

	return 0;

err_icm:
	mlx4_qp_free_icm(dev, qpn);
	return err;
}
EXPORT_SYMBOL_GPL(mlx4_qp_alloc);
int mlx4_update_qp(struct mlx4_dev *dev, u32 qpn,
		   enum mlx4_update_qp_attr attr,
		   struct mlx4_update_qp_params *params)
{
	struct mlx4_cmd_mailbox *mailbox;
	struct mlx4_update_qp_context *cmd;
	u64 pri_addr_path_mask = 0;
	u64 qp_mask = 0;
	int err = 0;

	if (!attr || (attr & ~MLX4_UPDATE_QP_SUPPORTED_ATTRS))
		return -EINVAL;

	mailbox = mlx4_alloc_cmd_mailbox(dev);
	if (IS_ERR(mailbox))
		return PTR_ERR(mailbox);

	cmd = (struct mlx4_update_qp_context *)mailbox->buf;

	if (attr & MLX4_UPDATE_QP_SMAC) {
		pri_addr_path_mask |= 1ULL << MLX4_UPD_QP_PATH_MASK_MAC_INDEX;
		cmd->qp_context.pri_path.grh_mylmc = params->smac_index;
	}

	if (attr & MLX4_UPDATE_QP_ETH_SRC_CHECK_MC_LB) {
		if (!(dev->caps.flags2
		      & MLX4_DEV_CAP_FLAG2_UPDATE_QP_SRC_CHECK_LB)) {
			mlx4_warn(dev,
				  "Trying to set src check LB, but it isn't supported\n");
			err = -EOPNOTSUPP;
			goto out;
		}
		pri_addr_path_mask |=
			1ULL << MLX4_UPD_QP_PATH_MASK_ETH_SRC_CHECK_MC_LB;
		if (params->flags &
		    MLX4_UPDATE_QP_PARAMS_FLAGS_ETH_CHECK_MC_LB) {
			cmd->qp_context.pri_path.fl |=
				MLX4_FL_ETH_SRC_CHECK_MC_LB;
		}
	}

	if (attr & MLX4_UPDATE_QP_VSD) {
		qp_mask |= 1ULL << MLX4_UPD_QP_MASK_VSD;
		if (params->flags & MLX4_UPDATE_QP_PARAMS_FLAGS_VSD_ENABLE)
			cmd->qp_context.param3 |= cpu_to_be32(MLX4_STRIP_VLAN);
	}

	if (attr & MLX4_UPDATE_QP_RATE_LIMIT) {
		qp_mask |= 1ULL << MLX4_UPD_QP_MASK_RATE_LIMIT;
		cmd->qp_context.rate_limit_params = cpu_to_be16((params->rate_unit << 14) | params->rate_val);
	}

	if (attr & MLX4_UPDATE_QP_QOS_VPORT) {
		qp_mask |= 1ULL << MLX4_UPD_QP_MASK_QOS_VPP;
		cmd->qp_context.qos_vport = params->qos_vport;
	}

	cmd->primary_addr_path_mask = cpu_to_be64(pri_addr_path_mask);
	cmd->qp_mask = cpu_to_be64(qp_mask);

	err = mlx4_cmd(dev, mailbox->dma, qpn & 0xffffff, 0,
		       MLX4_CMD_UPDATE_QP, MLX4_CMD_TIME_CLASS_A,
		       MLX4_CMD_NATIVE);
out:
	mlx4_free_cmd_mailbox(dev, mailbox);
	return err;
}
EXPORT_SYMBOL_GPL(mlx4_update_qp);
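/*
 * Sketch of a caller (illustrative only, not from this file): cap the send
 * rate of an existing QP through MLX4_UPDATE_QP_RATE_LIMIT.  rate_unit and
 * rate_val are packed into rate_limit_params exactly as done above.
 *
 *	struct mlx4_update_qp_params params = {
 *		.rate_unit = rate_unit,
 *		.rate_val  = rate_val,
 *	};
 *
 *	err = mlx4_update_qp(dev, qpn, MLX4_UPDATE_QP_RATE_LIMIT, &params);
 */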
void mlx4_qp_remove(struct mlx4_dev *dev, struct mlx4_qp *qp)
{
	struct mlx4_qp_table *qp_table = &mlx4_priv(dev)->qp_table;
	unsigned long flags;

	spin_lock_irqsave(&qp_table->lock, flags);
	radix_tree_delete(&dev->qp_table_tree, qp->qpn & (dev->caps.num_qps - 1));
	spin_unlock_irqrestore(&qp_table->lock, flags);
}
EXPORT_SYMBOL_GPL(mlx4_qp_remove);
void mlx4_qp_free(struct mlx4_dev *dev, struct mlx4_qp *qp)
{
	if (atomic_dec_and_test(&qp->refcount))
		complete(&qp->free);
	wait_for_completion(&qp->free);

	mlx4_qp_free_icm(dev, qp->qpn);
}
EXPORT_SYMBOL_GPL(mlx4_qp_free);
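/*
 * Teardown ordering: mlx4_qp_remove() takes the QP out of the radix tree so
 * no new event handler can look it up, and mlx4_qp_free() then drops the
 * caller's reference and waits on qp->free until any handler still running
 * (see mlx4_qp_event() above) has dropped its reference too, before the ICM
 * backing the QP is released.
 */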
static int mlx4_CONF_SPECIAL_QP(struct mlx4_dev *dev, u32 base_qpn)
{
	return mlx4_cmd(dev, 0, base_qpn, 0, MLX4_CMD_CONF_SPECIAL_QP,
			MLX4_CMD_TIME_CLASS_B, MLX4_CMD_NATIVE);
}
#define MLX4_QP_TABLE_RSS_ETH_PRIORITY 2
#define MLX4_QP_TABLE_RAW_ETH_PRIORITY 1
#define MLX4_QP_TABLE_RAW_ETH_SIZE     256
static int mlx4_create_zones(struct mlx4_dev *dev,
			     u32 reserved_bottom_general,
			     u32 reserved_top_general,
			     u32 reserved_bottom_rss,
			     u32 start_offset_rss,
			     u32 max_table_offset)
{
	struct mlx4_qp_table *qp_table = &mlx4_priv(dev)->qp_table;
	struct mlx4_bitmap (*bitmap)[MLX4_QP_TABLE_ZONE_NUM] = NULL;
	int bitmap_initialized = 0;
	u32 last_offset;
	int k;
	int err;

	qp_table->zones = mlx4_zone_allocator_create(MLX4_ZONE_ALLOC_FLAGS_NO_OVERLAP);

	if (NULL == qp_table->zones)
		return -ENOMEM;

	bitmap = kmalloc(sizeof(*bitmap), GFP_KERNEL);

	if (NULL == bitmap) {
		err = -ENOMEM;
		goto free_zone;
	}

	err = mlx4_bitmap_init(*bitmap + MLX4_QP_TABLE_ZONE_GENERAL, dev->caps.num_qps,
			       (1 << 23) - 1, reserved_bottom_general,
			       reserved_top_general);

	if (err)
		goto free_bitmap;

	++bitmap_initialized;

	err = mlx4_zone_add_one(qp_table->zones, *bitmap + MLX4_QP_TABLE_ZONE_GENERAL,
				MLX4_ZONE_FALLBACK_TO_HIGHER_PRIO |
				MLX4_ZONE_USE_RR, 0,
				0, qp_table->zones_uids + MLX4_QP_TABLE_ZONE_GENERAL);

	if (err)
		goto free_bitmap;

	err = mlx4_bitmap_init(*bitmap + MLX4_QP_TABLE_ZONE_RSS,
			       reserved_bottom_rss,
			       reserved_bottom_rss - 1,
			       dev->caps.reserved_qps_cnt[MLX4_QP_REGION_FW],
			       reserved_bottom_rss - start_offset_rss);

	if (err)
		goto free_bitmap;

	++bitmap_initialized;

	err = mlx4_zone_add_one(qp_table->zones, *bitmap + MLX4_QP_TABLE_ZONE_RSS,
				MLX4_ZONE_ALLOW_ALLOC_FROM_LOWER_PRIO |
				MLX4_ZONE_ALLOW_ALLOC_FROM_EQ_PRIO |
				MLX4_ZONE_USE_RR, MLX4_QP_TABLE_RSS_ETH_PRIORITY,
				0, qp_table->zones_uids + MLX4_QP_TABLE_ZONE_RSS);

	if (err)
		goto free_bitmap;

	last_offset = dev->caps.reserved_qps_cnt[MLX4_QP_REGION_FW];
	/*  We have a single zone for the A0 steering QPs area of the FW. This area
	 *  needs to be split into subareas. One set of subareas is for RSS QPs
	 *  (in which qp number bits 6 and/or 7 are set); the other set of subareas
	 *  is for RAW_ETH QPs, which require that both bits 6 and 7 are zero.
	 *  Currently, the values returned by the FW (A0 steering area starting qp number
	 *  and A0 steering area size) are such that there are only two subareas -- one
	 *  for RSS and one for RAW_ETH.
	 */
	for (k = MLX4_QP_TABLE_ZONE_RSS + 1; k < sizeof(*bitmap)/sizeof((*bitmap)[0]);
	     k++) {
		int size;
		u32 offset = start_offset_rss;
		u32 bf_mask;
		u32 requested_size;

		/* Assuming MLX4_BF_QP_SKIP_MASK is consecutive ones, this calculates
		 * a mask of all LSB bits set until (and not including) the first
		 * set bit of MLX4_BF_QP_SKIP_MASK. For example, if MLX4_BF_QP_SKIP_MASK
		 * is 0xc0, bf_mask will be 0x3f.
		 */
		bf_mask = (MLX4_BF_QP_SKIP_MASK & ~(MLX4_BF_QP_SKIP_MASK - 1)) - 1;
		requested_size = min((u32)MLX4_QP_TABLE_RAW_ETH_SIZE, bf_mask + 1);

		if (((last_offset & MLX4_BF_QP_SKIP_MASK) &&
		     ((int)(max_table_offset - last_offset)) >=
		     roundup_pow_of_two(MLX4_BF_QP_SKIP_MASK)) ||
		    (!(last_offset & MLX4_BF_QP_SKIP_MASK) &&
		     !((last_offset + requested_size - 1) &
		       MLX4_BF_QP_SKIP_MASK)))
			size = requested_size;
		else {
			u32 candidate_offset =
				(last_offset | MLX4_BF_QP_SKIP_MASK | bf_mask) + 1;

			if (last_offset & MLX4_BF_QP_SKIP_MASK)
				last_offset = candidate_offset;

			/* From this point, the BF bits are 0 */

			if (last_offset > max_table_offset) {
				/* need to skip */
				size = -1;
			} else {
				size = min3(max_table_offset - last_offset,
					    bf_mask - (last_offset & bf_mask),
					    requested_size);
				if (size < requested_size) {
					int candidate_size;

					candidate_size = min3(
						max_table_offset - candidate_offset,
						bf_mask - (last_offset & bf_mask),
						requested_size);

					/*  We will not take this path if last_offset was
					 *  already set above to candidate_offset
					 */
					if (candidate_size > size) {
						last_offset = candidate_offset;
						size = candidate_size;
					}
				}
			}
		}

		if (size > 0) {
			/* mlx4_bitmap_alloc_range will find a contiguous range of "size"
			 * QPs in which both bits 6 and 7 are zero, because we pass it the
			 * MLX4_BF_SKIP_MASK).
			 */
			offset = mlx4_bitmap_alloc_range(
					*bitmap + MLX4_QP_TABLE_ZONE_RSS,
					size, 1,
					MLX4_BF_QP_SKIP_MASK);

			if (offset == (u32)-1) {
				err = -ENOMEM;
				break;
			}

			last_offset = offset + size;

			err = mlx4_bitmap_init(*bitmap + k, roundup_pow_of_two(size),
					       roundup_pow_of_two(size) - 1, 0,
					       roundup_pow_of_two(size) - size);
		} else {
			/* Add an empty bitmap, we'll allocate from different zones (since
			 * at least one is reserved)
			 */
			err = mlx4_bitmap_init(*bitmap + k, 1,
					       MLX4_QP_TABLE_RAW_ETH_SIZE - 1, 0,
					       0);
			mlx4_bitmap_alloc_range(*bitmap + k, 1, 1, 0);
		}

		if (err)
			break;

		++bitmap_initialized;

		err = mlx4_zone_add_one(qp_table->zones, *bitmap + k,
					MLX4_ZONE_ALLOW_ALLOC_FROM_LOWER_PRIO |
					MLX4_ZONE_ALLOW_ALLOC_FROM_EQ_PRIO |
					MLX4_ZONE_USE_RR, MLX4_QP_TABLE_RAW_ETH_PRIORITY,
					offset, qp_table->zones_uids + k);

		if (err)
			break;
	}

	if (err)
		goto free_bitmap;

	qp_table->bitmap_gen = *bitmap;

	return err;

free_bitmap:
	for (k = 0; k < bitmap_initialized; k++)
		mlx4_bitmap_cleanup(*bitmap + k);
	kfree(bitmap);
free_zone:
	mlx4_zone_allocator_destroy(qp_table->zones);
	return err;
}
static void mlx4_cleanup_qp_zones(struct mlx4_dev *dev)
{
	struct mlx4_qp_table *qp_table = &mlx4_priv(dev)->qp_table;

	if (qp_table->zones) {
		int i;

		for (i = 0;
		     i < sizeof(qp_table->zones_uids)/sizeof(qp_table->zones_uids[0]);
		     i++) {
			struct mlx4_bitmap *bitmap =
				mlx4_zone_get_bitmap(qp_table->zones,
						     qp_table->zones_uids[i]);

			mlx4_zone_remove_one(qp_table->zones, qp_table->zones_uids[i]);
			if (NULL == bitmap)
				continue;

			mlx4_bitmap_cleanup(bitmap);
		}
		mlx4_zone_allocator_destroy(qp_table->zones);
		kfree(qp_table->bitmap_gen);
		qp_table->bitmap_gen = NULL;
		qp_table->zones = NULL;
	}
}
int mlx4_init_qp_table(struct mlx4_dev *dev)
{
	struct mlx4_qp_table *qp_table = &mlx4_priv(dev)->qp_table;
	int err;
	int reserved_from_top = 0;
	int reserved_from_bot;
	int k;
	int fixed_reserved_from_bot_rv = 0;
	int bottom_reserved_for_rss_bitmap;
	u32 max_table_offset = dev->caps.dmfs_high_rate_qpn_base +
			dev->caps.dmfs_high_rate_qpn_range;

	spin_lock_init(&qp_table->lock);
	INIT_RADIX_TREE(&dev->qp_table_tree, GFP_ATOMIC);
	if (mlx4_is_slave(dev))
		return 0;

	/* We reserve 2 extra QPs per port for the special QPs.  The
	 * block of special QPs must be aligned to a multiple of 8, so
	 * round up.
	 *
	 * We also reserve the MSB of the 24-bit QP number to indicate
	 * that a QP is an XRC QP.
	 */
	for (k = 0; k <= MLX4_QP_REGION_BOTTOM; k++)
		fixed_reserved_from_bot_rv += dev->caps.reserved_qps_cnt[k];

	if (fixed_reserved_from_bot_rv < max_table_offset)
		fixed_reserved_from_bot_rv = max_table_offset;

	/* We reserve at least 1 extra for bitmaps that we don't have enough space for*/
	bottom_reserved_for_rss_bitmap =
		roundup_pow_of_two(fixed_reserved_from_bot_rv + 1);
	dev->phys_caps.base_sqpn = ALIGN(bottom_reserved_for_rss_bitmap, 8);

	{
		int sort[MLX4_NUM_QP_REGION];
		int i, j;
		int last_base = dev->caps.num_qps;

		for (i = 1; i < MLX4_NUM_QP_REGION; ++i)
			sort[i] = i;

		for (i = MLX4_NUM_QP_REGION; i > MLX4_QP_REGION_BOTTOM; --i) {
			for (j = MLX4_QP_REGION_BOTTOM + 2; j < i; ++j) {
				if (dev->caps.reserved_qps_cnt[sort[j]] >
				    dev->caps.reserved_qps_cnt[sort[j - 1]])
					swap(sort[j], sort[j - 1]);
			}
		}

		for (i = MLX4_QP_REGION_BOTTOM + 1; i < MLX4_NUM_QP_REGION; ++i) {
			last_base -= dev->caps.reserved_qps_cnt[sort[i]];
			dev->caps.reserved_qps_base[sort[i]] = last_base;
			reserved_from_top +=
				dev->caps.reserved_qps_cnt[sort[i]];
		}
	}

	/* Reserve 8 real SQPs in both native and SRIOV modes.
	 * In addition, in SRIOV mode, reserve 8 proxy SQPs per function
	 * (for all PFs and VFs), and 8 corresponding tunnel QPs.
	 * Each proxy SQP works opposite its own tunnel QP.
	 *
	 * The QPs are arranged as follows:
	 * a. 8 real SQPs
	 * b. All the proxy SQPs (8 per function)
	 * c. All the tunnel QPs (8 per function)
	 */
	reserved_from_bot = mlx4_num_reserved_sqps(dev);
	if (reserved_from_bot + reserved_from_top > dev->caps.num_qps) {
		mlx4_err(dev, "Number of reserved QPs is higher than number of QPs\n");
		return -EINVAL;
	}

	err = mlx4_create_zones(dev, reserved_from_bot, reserved_from_bot,
				bottom_reserved_for_rss_bitmap,
				fixed_reserved_from_bot_rv,
				max_table_offset);

	if (err)
		return err;

	if (mlx4_is_mfunc(dev)) {
		/* for PPF use */
		dev->phys_caps.base_proxy_sqpn = dev->phys_caps.base_sqpn + 8;
		dev->phys_caps.base_tunnel_sqpn = dev->phys_caps.base_sqpn + 8 + 8 * MLX4_MFUNC_MAX;

		/* In mfunc, calculate proxy and tunnel qp offsets for the PF here,
		 * since the PF does not call mlx4_slave_caps */
		dev->caps.qp0_tunnel = kcalloc(dev->caps.num_ports, sizeof (u32), GFP_KERNEL);
		dev->caps.qp0_proxy = kcalloc(dev->caps.num_ports, sizeof (u32), GFP_KERNEL);
		dev->caps.qp1_tunnel = kcalloc(dev->caps.num_ports, sizeof (u32), GFP_KERNEL);
		dev->caps.qp1_proxy = kcalloc(dev->caps.num_ports, sizeof (u32), GFP_KERNEL);

		if (!dev->caps.qp0_tunnel || !dev->caps.qp0_proxy ||
		    !dev->caps.qp1_tunnel || !dev->caps.qp1_proxy) {
			err = -ENOMEM;
			goto err_mem;
		}

		for (k = 0; k < dev->caps.num_ports; k++) {
			dev->caps.qp0_proxy[k] = dev->phys_caps.base_proxy_sqpn +
				8 * mlx4_master_func_num(dev) + k;
			dev->caps.qp0_tunnel[k] = dev->caps.qp0_proxy[k] + 8 * MLX4_MFUNC_MAX;
			dev->caps.qp1_proxy[k] = dev->phys_caps.base_proxy_sqpn +
				8 * mlx4_master_func_num(dev) + MLX4_MAX_PORTS + k;
			dev->caps.qp1_tunnel[k] = dev->caps.qp1_proxy[k] + 8 * MLX4_MFUNC_MAX;
		}
	}

	err = mlx4_CONF_SPECIAL_QP(dev, dev->phys_caps.base_sqpn);
	if (err)
		goto err_mem;

	return err;

err_mem:
	kfree(dev->caps.qp0_tunnel);
	kfree(dev->caps.qp0_proxy);
	kfree(dev->caps.qp1_tunnel);
	kfree(dev->caps.qp1_proxy);
	dev->caps.qp0_tunnel = dev->caps.qp0_proxy =
		dev->caps.qp1_tunnel = dev->caps.qp1_proxy = NULL;
	mlx4_cleanup_qp_zones(dev);
	return err;
}

void mlx4_cleanup_qp_table(struct mlx4_dev *dev)
{
	if (mlx4_is_slave(dev))
		return;

	mlx4_CONF_SPECIAL_QP(dev, 0);

	mlx4_cleanup_qp_zones(dev);
}

int mlx4_qp_query(struct mlx4_dev *dev, struct mlx4_qp *qp,
		  struct mlx4_qp_context *context)
{
	struct mlx4_cmd_mailbox *mailbox;
	int err;

	mailbox = mlx4_alloc_cmd_mailbox(dev);
	if (IS_ERR(mailbox))
		return PTR_ERR(mailbox);

	err = mlx4_cmd_box(dev, 0, mailbox->dma, qp->qpn, 0,
			   MLX4_CMD_QUERY_QP, MLX4_CMD_TIME_CLASS_A,
			   MLX4_CMD_WRAPPED);
	if (!err)
		memcpy(context, mailbox->buf + 8, sizeof *context);

	mlx4_free_cmd_mailbox(dev, mailbox);
	return err;
}
EXPORT_SYMBOL_GPL(mlx4_qp_query);

int mlx4_qp_to_ready(struct mlx4_dev *dev, struct mlx4_mtt *mtt,
		     struct mlx4_qp_context *context,
		     struct mlx4_qp *qp, enum mlx4_qp_state *qp_state)
{
	int err;
	int i;
	enum mlx4_qp_state states[] = {
		MLX4_QP_STATE_RST,
		MLX4_QP_STATE_INIT,
		MLX4_QP_STATE_RTR,
		MLX4_QP_STATE_RTS
	};

	for (i = 0; i < ARRAY_SIZE(states) - 1; i++) {
		context->flags &= cpu_to_be32(~(0xf << 28));
		context->flags |= cpu_to_be32(states[i + 1] << 28);
		if (states[i + 1] != MLX4_QP_STATE_RTR)
			context->params2 &= ~MLX4_QP_BIT_FPP;
		err = mlx4_qp_modify(dev, mtt, states[i], states[i + 1],
				     context, 0, 0, qp);
		if (err) {
			mlx4_err(dev, "Failed to bring QP to state: %d with error: %d\n",
				 states[i + 1], err);
			return err;
		}

		*qp_state = states[i + 1];
	}

	return 0;
}
EXPORT_SYMBOL_GPL(mlx4_qp_to_ready);

u16 mlx4_qp_roce_entropy(struct mlx4_dev *dev, u32 qpn)
{
	struct mlx4_qp_context context;
	struct mlx4_qp qp;
	int err;

	qp.qpn = qpn;
	err = mlx4_qp_query(dev, &qp, &context);
	if (!err) {
		u32 dest_qpn = be32_to_cpu(context.remote_qpn) & 0xffffff;
		u16 folded_dst = folded_qp(dest_qpn);
		u16 folded_src = folded_qp(qpn);

		return (dest_qpn != qpn) ?
			((folded_dst ^ folded_src) | 0xC000) :
			folded_src | 0xC000;
	}

	return 0xdead;
}
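/*
 * The value produced above seeds the RoCE v2 UDP source port for the QP:
 * folded_qp() (a small helper in mlx4.h) folds the 24-bit QP numbers down to
 * 16 bits, source and destination are XORed for per-flow entropy, and ORing
 * with 0xC000 keeps the result inside the dynamic/ephemeral port range
 * (49152-65535).
 */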