/*
 * Copyright (c) 2015, Mellanox Technologies. All rights reserved.
 *
 * This software is available to you under a choice of one of two
 * licenses.  You may choose to be licensed under the terms of the GNU
 * General Public License (GPL) Version 2, available from the file
 * COPYING in the main directory of this source tree, or the
 * OpenIB.org BSD license below:
 *
 *     Redistribution and use in source and binary forms, with or
 *     without modification, are permitted provided that the following
 *     conditions are met:
 *
 *      - Redistributions of source code must retain the above
 *        copyright notice, this list of conditions and the following
 *        disclaimer.
 *
 *      - Redistributions in binary form must reproduce the above
 *        copyright notice, this list of conditions and the following
 *        disclaimer in the documentation and/or other materials
 *        provided with the distribution.
 *
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
 * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
 * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
 * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS
 * BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN
 * ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN
 * CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
 * SOFTWARE.
 */
#include <linux/etherdevice.h>
#include <linux/mlx5/driver.h>
#include <linux/mlx5/mlx5_ifc.h>
#include <linux/mlx5/vport.h>
#include <linux/mlx5/fs.h>
#include "esw/acl/lgcy.h"
#include "mlx5_core.h"
#include "en/mod_hdr.h"
/* Vport UC/MC hash node */
struct vport_addr {
	struct l2addr_node	node;
	u8			action;
	u16			vport;
	struct mlx5_flow_handle *flow_rule;
	bool mpfs; /* UC MAC was added to MPFs */
	/* A flag indicating that mac was added due to mc promiscuous vport */
	bool mc_promisc;
};
static void esw_destroy_legacy_fdb_table(struct mlx5_eswitch *esw);
static void esw_cleanup_vepa_rules(struct mlx5_eswitch *esw);
static int mlx5_eswitch_check(const struct mlx5_core_dev *dev)
{
	if (MLX5_CAP_GEN(dev, port_type) != MLX5_CAP_PORT_TYPE_ETH)
		return -EOPNOTSUPP;

	if (!MLX5_ESWITCH_MANAGER(dev))
		return -EOPNOTSUPP;

	return 0;
}
struct mlx5_eswitch *mlx5_devlink_eswitch_get(struct devlink *devlink)
{
	struct mlx5_core_dev *dev = devlink_priv(devlink);
	int err;

	err = mlx5_eswitch_check(dev);
	if (err)
		return ERR_PTR(err);

	return dev->priv.eswitch;
}
struct mlx5_vport *__must_check
mlx5_eswitch_get_vport(struct mlx5_eswitch *esw, u16 vport_num)
{
	u16 idx;

	if (!esw || !MLX5_CAP_GEN(esw->dev, vport_group_manager))
		return ERR_PTR(-EPERM);

	idx = mlx5_eswitch_vport_num_to_index(esw, vport_num);

	if (idx > esw->total_vports - 1) {
		esw_debug(esw->dev, "vport out of range: num(0x%x), idx(0x%x)\n",
			  vport_num, idx);
		return ERR_PTR(-EINVAL);
	}

	return &esw->vports[idx];
}
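/* mlx5_eswitch_get_vport() can return ERR_PTR(-EPERM) when the device is not a
 * vport group manager and ERR_PTR(-EINVAL) for an out-of-range vport number,
 * hence the __must_check above: callers should test the result with IS_ERR()
 * before dereferencing it.
 */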
static int arm_vport_context_events_cmd(struct mlx5_core_dev *dev, u16 vport,
					u32 events_mask)
{
	u32 in[MLX5_ST_SZ_DW(modify_nic_vport_context_in)] = {};
	void *nic_vport_ctx;

	MLX5_SET(modify_nic_vport_context_in, in,
		 opcode, MLX5_CMD_OP_MODIFY_NIC_VPORT_CONTEXT);
	MLX5_SET(modify_nic_vport_context_in, in, field_select.change_event, 1);
	MLX5_SET(modify_nic_vport_context_in, in, vport_number, vport);
	MLX5_SET(modify_nic_vport_context_in, in, other_vport, 1);
	nic_vport_ctx = MLX5_ADDR_OF(modify_nic_vport_context_in,
				     in, nic_vport_context);

	MLX5_SET(nic_vport_context, nic_vport_ctx, arm_change_event, 1);

	if (events_mask & MLX5_VPORT_UC_ADDR_CHANGE)
		MLX5_SET(nic_vport_context, nic_vport_ctx,
			 event_on_uc_address_change, 1);
	if (events_mask & MLX5_VPORT_MC_ADDR_CHANGE)
		MLX5_SET(nic_vport_context, nic_vport_ctx,
			 event_on_mc_address_change, 1);
	if (events_mask & MLX5_VPORT_PROMISC_CHANGE)
		MLX5_SET(nic_vport_context, nic_vport_ctx,
			 event_on_promisc_change, 1);

	return mlx5_cmd_exec_in(dev, modify_nic_vport_context, in);
}
/* E-Switch vport context HW commands */
int mlx5_eswitch_modify_esw_vport_context(struct mlx5_core_dev *dev, u16 vport,
					  bool other_vport, void *in)
{
	MLX5_SET(modify_esw_vport_context_in, in, opcode,
		 MLX5_CMD_OP_MODIFY_ESW_VPORT_CONTEXT);
	MLX5_SET(modify_esw_vport_context_in, in, vport_number, vport);
	MLX5_SET(modify_esw_vport_context_in, in, other_vport, other_vport);
	return mlx5_cmd_exec_in(dev, modify_esw_vport_context, in);
}
static int modify_esw_vport_cvlan(struct mlx5_core_dev *dev, u16 vport,
				  u16 vlan, u8 qos, u8 set_flags)
{
	u32 in[MLX5_ST_SZ_DW(modify_esw_vport_context_in)] = {};

	if (!MLX5_CAP_ESW(dev, vport_cvlan_strip) ||
	    !MLX5_CAP_ESW(dev, vport_cvlan_insert_if_not_exist))
		return -EOPNOTSUPP;

	esw_debug(dev, "Set Vport[%d] VLAN %d qos %d set=%x\n",
		  vport, vlan, qos, set_flags);

	if (set_flags & SET_VLAN_STRIP)
		MLX5_SET(modify_esw_vport_context_in, in,
			 esw_vport_context.vport_cvlan_strip, 1);

	if (set_flags & SET_VLAN_INSERT) {
		/* insert only if no vlan in packet */
		MLX5_SET(modify_esw_vport_context_in, in,
			 esw_vport_context.vport_cvlan_insert, 1);

		MLX5_SET(modify_esw_vport_context_in, in,
			 esw_vport_context.cvlan_pcp, qos);
		MLX5_SET(modify_esw_vport_context_in, in,
			 esw_vport_context.cvlan_id, vlan);
	}

	MLX5_SET(modify_esw_vport_context_in, in,
		 field_select.vport_cvlan_strip, 1);
	MLX5_SET(modify_esw_vport_context_in, in,
		 field_select.vport_cvlan_insert, 1);

	return mlx5_eswitch_modify_esw_vport_context(dev, vport, true, in);
}
static struct mlx5_flow_handle *
__esw_fdb_set_vport_rule(struct mlx5_eswitch *esw, u16 vport, bool rx_rule,
			 u8 mac_c[ETH_ALEN], u8 mac_v[ETH_ALEN])
{
	int match_header = (is_zero_ether_addr(mac_c) ? 0 :
			    MLX5_MATCH_OUTER_HEADERS);
	struct mlx5_flow_handle *flow_rule = NULL;
	struct mlx5_flow_act flow_act = {0};
	struct mlx5_flow_destination dest = {};
	struct mlx5_flow_spec *spec;
	void *mv_misc = NULL;
	void *mc_misc = NULL;
	u8 *dmac_v = NULL;
	u8 *dmac_c = NULL;

	if (rx_rule)
		match_header |= MLX5_MATCH_MISC_PARAMETERS;

	spec = kvzalloc(sizeof(*spec), GFP_KERNEL);
	if (!spec)
		return NULL;

	dmac_v = MLX5_ADDR_OF(fte_match_param, spec->match_value,
			      outer_headers.dmac_47_16);
	dmac_c = MLX5_ADDR_OF(fte_match_param, spec->match_criteria,
			      outer_headers.dmac_47_16);

	if (match_header & MLX5_MATCH_OUTER_HEADERS) {
		ether_addr_copy(dmac_v, mac_v);
		ether_addr_copy(dmac_c, mac_c);
	}

	if (match_header & MLX5_MATCH_MISC_PARAMETERS) {
		mv_misc = MLX5_ADDR_OF(fte_match_param, spec->match_value,
				       misc_parameters);
		mc_misc = MLX5_ADDR_OF(fte_match_param, spec->match_criteria,
				       misc_parameters);
		MLX5_SET(fte_match_set_misc, mv_misc, source_port, MLX5_VPORT_UPLINK);
		MLX5_SET_TO_ONES(fte_match_set_misc, mc_misc, source_port);
	}

	dest.type = MLX5_FLOW_DESTINATION_TYPE_VPORT;
	dest.vport.num = vport;

	esw_debug(esw->dev,
		  "\tFDB add rule dmac_v(%pM) dmac_c(%pM) -> vport(%d)\n",
		  dmac_v, dmac_c, vport);
	spec->match_criteria_enable = match_header;
	flow_act.action = MLX5_FLOW_CONTEXT_ACTION_FWD_DEST;
	flow_rule =
		mlx5_add_flow_rules(esw->fdb_table.legacy.fdb, spec,
				    &flow_act, &dest, 1);
	if (IS_ERR(flow_rule)) {
		esw_warn(esw->dev,
			 "FDB: Failed to add flow rule: dmac_v(%pM) dmac_c(%pM) -> vport(%d), err(%ld)\n",
			 dmac_v, dmac_c, vport, PTR_ERR(flow_rule));
		flow_rule = NULL;
	}

	kvfree(spec);
	return flow_rule;
}
static struct mlx5_flow_handle *
esw_fdb_set_vport_rule(struct mlx5_eswitch *esw, u8 mac[ETH_ALEN], u16 vport)
{
	u8 mac_c[ETH_ALEN];

	eth_broadcast_addr(mac_c);
	return __esw_fdb_set_vport_rule(esw, vport, false, mac_c, mac);
}
static struct mlx5_flow_handle *
esw_fdb_set_vport_allmulti_rule(struct mlx5_eswitch *esw, u16 vport)
{
	u8 mac_c[ETH_ALEN];
	u8 mac_v[ETH_ALEN];

	eth_zero_addr(mac_c);
	eth_zero_addr(mac_v);
	/* match only the multicast bit of the DMAC */
	mac_c[0] = 0x01;
	mac_v[0] = 0x01;
	return __esw_fdb_set_vport_rule(esw, vport, false, mac_c, mac_v);
}
static struct mlx5_flow_handle *
esw_fdb_set_vport_promisc_rule(struct mlx5_eswitch *esw, u16 vport)
{
	u8 mac_c[ETH_ALEN];
	u8 mac_v[ETH_ALEN];

	eth_zero_addr(mac_c);
	eth_zero_addr(mac_v);
	return __esw_fdb_set_vport_rule(esw, vport, true, mac_c, mac_v);
}
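/* Taken together, the three wrappers above cover the legacy FDB cases: an exact
 * DMAC match that forwards to a given vport, an allmulti rule that matches only
 * the multicast bit of the DMAC, and a promiscuous rule that matches on the
 * misc source_port (uplink) instead of the DMAC (rx_rule = true).
 */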
enum {
	LEGACY_VEPA_PRIO = 0,
	LEGACY_FDB_PRIO,
};
286 static int esw_create_legacy_vepa_table(struct mlx5_eswitch
*esw
)
288 struct mlx5_flow_table_attr ft_attr
= {};
289 struct mlx5_core_dev
*dev
= esw
->dev
;
290 struct mlx5_flow_namespace
*root_ns
;
291 struct mlx5_flow_table
*fdb
;
294 root_ns
= mlx5_get_fdb_sub_ns(dev
, 0);
296 esw_warn(dev
, "Failed to get FDB flow namespace\n");
300 /* num FTE 2, num FG 2 */
301 ft_attr
.prio
= LEGACY_VEPA_PRIO
;
303 ft_attr
.autogroup
.max_num_groups
= 2;
304 fdb
= mlx5_create_auto_grouped_flow_table(root_ns
, &ft_attr
);
307 esw_warn(dev
, "Failed to create VEPA FDB err %d\n", err
);
310 esw
->fdb_table
.legacy
.vepa_fdb
= fdb
;
315 static int esw_create_legacy_fdb_table(struct mlx5_eswitch
*esw
)
317 int inlen
= MLX5_ST_SZ_BYTES(create_flow_group_in
);
318 struct mlx5_flow_table_attr ft_attr
= {};
319 struct mlx5_core_dev
*dev
= esw
->dev
;
320 struct mlx5_flow_namespace
*root_ns
;
321 struct mlx5_flow_table
*fdb
;
322 struct mlx5_flow_group
*g
;
323 void *match_criteria
;
329 esw_debug(dev
, "Create FDB log_max_size(%d)\n",
330 MLX5_CAP_ESW_FLOWTABLE_FDB(dev
, log_max_ft_size
));
332 root_ns
= mlx5_get_fdb_sub_ns(dev
, 0);
334 esw_warn(dev
, "Failed to get FDB flow namespace\n");
338 flow_group_in
= kvzalloc(inlen
, GFP_KERNEL
);
342 table_size
= BIT(MLX5_CAP_ESW_FLOWTABLE_FDB(dev
, log_max_ft_size
));
343 ft_attr
.max_fte
= table_size
;
344 ft_attr
.prio
= LEGACY_FDB_PRIO
;
345 fdb
= mlx5_create_flow_table(root_ns
, &ft_attr
);
348 esw_warn(dev
, "Failed to create FDB Table err %d\n", err
);
351 esw
->fdb_table
.legacy
.fdb
= fdb
;
353 /* Addresses group : Full match unicast/multicast addresses */
354 MLX5_SET(create_flow_group_in
, flow_group_in
, match_criteria_enable
,
355 MLX5_MATCH_OUTER_HEADERS
);
356 match_criteria
= MLX5_ADDR_OF(create_flow_group_in
, flow_group_in
, match_criteria
);
357 dmac
= MLX5_ADDR_OF(fte_match_param
, match_criteria
, outer_headers
.dmac_47_16
);
358 MLX5_SET(create_flow_group_in
, flow_group_in
, start_flow_index
, 0);
	/* Preserve 2 entries for allmulti and promisc rules */
360 MLX5_SET(create_flow_group_in
, flow_group_in
, end_flow_index
, table_size
- 3);
361 eth_broadcast_addr(dmac
);
362 g
= mlx5_create_flow_group(fdb
, flow_group_in
);
365 esw_warn(dev
, "Failed to create flow group err(%d)\n", err
);
368 esw
->fdb_table
.legacy
.addr_grp
= g
;
370 /* Allmulti group : One rule that forwards any mcast traffic */
371 MLX5_SET(create_flow_group_in
, flow_group_in
, match_criteria_enable
,
372 MLX5_MATCH_OUTER_HEADERS
);
373 MLX5_SET(create_flow_group_in
, flow_group_in
, start_flow_index
, table_size
- 2);
374 MLX5_SET(create_flow_group_in
, flow_group_in
, end_flow_index
, table_size
- 2);
377 g
= mlx5_create_flow_group(fdb
, flow_group_in
);
380 esw_warn(dev
, "Failed to create allmulti flow group err(%d)\n", err
);
383 esw
->fdb_table
.legacy
.allmulti_grp
= g
;
	/* Promiscuous group :
	 * One rule that forwards all unmatched traffic from previous groups
	 */
389 MLX5_SET(create_flow_group_in
, flow_group_in
, match_criteria_enable
,
390 MLX5_MATCH_MISC_PARAMETERS
);
391 MLX5_SET_TO_ONES(fte_match_param
, match_criteria
, misc_parameters
.source_port
);
392 MLX5_SET(create_flow_group_in
, flow_group_in
, start_flow_index
, table_size
- 1);
393 MLX5_SET(create_flow_group_in
, flow_group_in
, end_flow_index
, table_size
- 1);
394 g
= mlx5_create_flow_group(fdb
, flow_group_in
);
397 esw_warn(dev
, "Failed to create promisc flow group err(%d)\n", err
);
400 esw
->fdb_table
.legacy
.promisc_grp
= g
;
404 esw_destroy_legacy_fdb_table(esw
);
406 kvfree(flow_group_in
);
410 static void esw_destroy_legacy_vepa_table(struct mlx5_eswitch
*esw
)
412 esw_debug(esw
->dev
, "Destroy VEPA Table\n");
413 if (!esw
->fdb_table
.legacy
.vepa_fdb
)
416 mlx5_destroy_flow_table(esw
->fdb_table
.legacy
.vepa_fdb
);
417 esw
->fdb_table
.legacy
.vepa_fdb
= NULL
;
420 static void esw_destroy_legacy_fdb_table(struct mlx5_eswitch
*esw
)
422 esw_debug(esw
->dev
, "Destroy FDB Table\n");
423 if (!esw
->fdb_table
.legacy
.fdb
)
426 if (esw
->fdb_table
.legacy
.promisc_grp
)
427 mlx5_destroy_flow_group(esw
->fdb_table
.legacy
.promisc_grp
);
428 if (esw
->fdb_table
.legacy
.allmulti_grp
)
429 mlx5_destroy_flow_group(esw
->fdb_table
.legacy
.allmulti_grp
);
430 if (esw
->fdb_table
.legacy
.addr_grp
)
431 mlx5_destroy_flow_group(esw
->fdb_table
.legacy
.addr_grp
);
432 mlx5_destroy_flow_table(esw
->fdb_table
.legacy
.fdb
);
434 esw
->fdb_table
.legacy
.fdb
= NULL
;
435 esw
->fdb_table
.legacy
.addr_grp
= NULL
;
436 esw
->fdb_table
.legacy
.allmulti_grp
= NULL
;
437 esw
->fdb_table
.legacy
.promisc_grp
= NULL
;
440 static int esw_create_legacy_table(struct mlx5_eswitch
*esw
)
444 memset(&esw
->fdb_table
.legacy
, 0, sizeof(struct legacy_fdb
));
446 err
= esw_create_legacy_vepa_table(esw
);
450 err
= esw_create_legacy_fdb_table(esw
);
452 esw_destroy_legacy_vepa_table(esw
);
457 static void esw_destroy_legacy_table(struct mlx5_eswitch
*esw
)
459 esw_cleanup_vepa_rules(esw
);
460 esw_destroy_legacy_fdb_table(esw
);
461 esw_destroy_legacy_vepa_table(esw
);
#define MLX5_LEGACY_SRIOV_VPORT_EVENTS (MLX5_VPORT_UC_ADDR_CHANGE | \
					MLX5_VPORT_MC_ADDR_CHANGE | \
					MLX5_VPORT_PROMISC_CHANGE)
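/* In legacy SRIOV mode the eswitch subscribes to UC/MC address list changes and
 * promiscuity changes on each vport, so the legacy FDB rules can be kept in
 * sync with what the VFs configure on their netdevs.
 */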
468 static int esw_legacy_enable(struct mlx5_eswitch
*esw
)
470 struct mlx5_vport
*vport
;
473 ret
= esw_create_legacy_table(esw
);
477 mlx5_esw_for_each_vf_vport(esw
, i
, vport
, esw
->esw_funcs
.num_vfs
)
478 vport
->info
.link_state
= MLX5_VPORT_ADMIN_STATE_AUTO
;
480 ret
= mlx5_eswitch_enable_pf_vf_vports(esw
, MLX5_LEGACY_SRIOV_VPORT_EVENTS
);
482 esw_destroy_legacy_table(esw
);
486 static void esw_legacy_disable(struct mlx5_eswitch
*esw
)
488 struct esw_mc_addr
*mc_promisc
;
490 mlx5_eswitch_disable_pf_vf_vports(esw
);
492 mc_promisc
= &esw
->mc_promisc
;
493 if (mc_promisc
->uplink_rule
)
494 mlx5_del_flow_rules(mc_promisc
->uplink_rule
);
496 esw_destroy_legacy_table(esw
);
499 /* E-Switch vport UC/MC lists management */
500 typedef int (*vport_addr_action
)(struct mlx5_eswitch
*esw
,
501 struct vport_addr
*vaddr
);
503 static int esw_add_uc_addr(struct mlx5_eswitch
*esw
, struct vport_addr
*vaddr
)
505 u8
*mac
= vaddr
->node
.addr
;
506 u16 vport
= vaddr
->vport
;
	/* Skip mlx5_mpfs_add_mac for eswitch managers,
	 * it is already done by its netdev in mlx5e_execute_l2_action
	 */
512 if (mlx5_esw_is_manager_vport(esw
, vport
))
515 err
= mlx5_mpfs_add_mac(esw
->dev
, mac
);
518 "Failed to add L2 table mac(%pM) for vport(0x%x), err(%d)\n",
525 /* SRIOV is enabled: Forward UC MAC to vport */
526 if (esw
->fdb_table
.legacy
.fdb
&& esw
->mode
== MLX5_ESWITCH_LEGACY
)
527 vaddr
->flow_rule
= esw_fdb_set_vport_rule(esw
, mac
, vport
);
529 esw_debug(esw
->dev
, "\tADDED UC MAC: vport[%d] %pM fr(%p)\n",
530 vport
, mac
, vaddr
->flow_rule
);
535 static int esw_del_uc_addr(struct mlx5_eswitch
*esw
, struct vport_addr
*vaddr
)
537 u8
*mac
= vaddr
->node
.addr
;
538 u16 vport
= vaddr
->vport
;
	/* Skip mlx5_mpfs_del_mac for eswitch managers,
	 * it is already done by its netdev in mlx5e_execute_l2_action
	 */
544 if (!vaddr
->mpfs
|| mlx5_esw_is_manager_vport(esw
, vport
))
547 err
= mlx5_mpfs_del_mac(esw
->dev
, mac
);
550 "Failed to del L2 table mac(%pM) for vport(%d), err(%d)\n",
555 if (vaddr
->flow_rule
)
556 mlx5_del_flow_rules(vaddr
->flow_rule
);
557 vaddr
->flow_rule
= NULL
;
562 static void update_allmulti_vports(struct mlx5_eswitch
*esw
,
563 struct vport_addr
*vaddr
,
564 struct esw_mc_addr
*esw_mc
)
566 u8
*mac
= vaddr
->node
.addr
;
567 struct mlx5_vport
*vport
;
570 mlx5_esw_for_all_vports(esw
, i
, vport
) {
571 struct hlist_head
*vport_hash
= vport
->mc_list
;
572 struct vport_addr
*iter_vaddr
=
573 l2addr_hash_find(vport_hash
,
576 vport_num
= vport
->vport
;
577 if (IS_ERR_OR_NULL(vport
->allmulti_rule
) ||
578 vaddr
->vport
== vport_num
)
580 switch (vaddr
->action
) {
581 case MLX5_ACTION_ADD
:
584 iter_vaddr
= l2addr_hash_add(vport_hash
, mac
,
589 "ALL-MULTI: Failed to add MAC(%pM) to vport[%d] DB\n",
593 iter_vaddr
->vport
= vport_num
;
594 iter_vaddr
->flow_rule
=
595 esw_fdb_set_vport_rule(esw
,
598 iter_vaddr
->mc_promisc
= true;
600 case MLX5_ACTION_DEL
:
603 mlx5_del_flow_rules(iter_vaddr
->flow_rule
);
604 l2addr_hash_del(iter_vaddr
);
610 static int esw_add_mc_addr(struct mlx5_eswitch
*esw
, struct vport_addr
*vaddr
)
612 struct hlist_head
*hash
= esw
->mc_table
;
613 struct esw_mc_addr
*esw_mc
;
614 u8
*mac
= vaddr
->node
.addr
;
615 u16 vport
= vaddr
->vport
;
617 if (!esw
->fdb_table
.legacy
.fdb
)
620 esw_mc
= l2addr_hash_find(hash
, mac
, struct esw_mc_addr
);
624 esw_mc
= l2addr_hash_add(hash
, mac
, struct esw_mc_addr
, GFP_KERNEL
);
628 esw_mc
->uplink_rule
= /* Forward MC MAC to Uplink */
629 esw_fdb_set_vport_rule(esw
, mac
, MLX5_VPORT_UPLINK
);
631 /* Add this multicast mac to all the mc promiscuous vports */
632 update_allmulti_vports(esw
, vaddr
, esw_mc
);
635 /* If the multicast mac is added as a result of mc promiscuous vport,
636 * don't increment the multicast ref count
638 if (!vaddr
->mc_promisc
)
641 /* Forward MC MAC to vport */
642 vaddr
->flow_rule
= esw_fdb_set_vport_rule(esw
, mac
, vport
);
644 "\tADDED MC MAC: vport[%d] %pM fr(%p) refcnt(%d) uplinkfr(%p)\n",
645 vport
, mac
, vaddr
->flow_rule
,
646 esw_mc
->refcnt
, esw_mc
->uplink_rule
);
650 static int esw_del_mc_addr(struct mlx5_eswitch
*esw
, struct vport_addr
*vaddr
)
652 struct hlist_head
*hash
= esw
->mc_table
;
653 struct esw_mc_addr
*esw_mc
;
654 u8
*mac
= vaddr
->node
.addr
;
655 u16 vport
= vaddr
->vport
;
657 if (!esw
->fdb_table
.legacy
.fdb
)
660 esw_mc
= l2addr_hash_find(hash
, mac
, struct esw_mc_addr
);
663 "Failed to find eswitch MC addr for MAC(%pM) vport(%d)",
668 "\tDELETE MC MAC: vport[%d] %pM fr(%p) refcnt(%d) uplinkfr(%p)\n",
669 vport
, mac
, vaddr
->flow_rule
, esw_mc
->refcnt
,
670 esw_mc
->uplink_rule
);
672 if (vaddr
->flow_rule
)
673 mlx5_del_flow_rules(vaddr
->flow_rule
);
674 vaddr
->flow_rule
= NULL
;
676 /* If the multicast mac is added as a result of mc promiscuous vport,
677 * don't decrement the multicast ref count.
679 if (vaddr
->mc_promisc
|| (--esw_mc
->refcnt
> 0))
682 /* Remove this multicast mac from all the mc promiscuous vports */
683 update_allmulti_vports(esw
, vaddr
, esw_mc
);
685 if (esw_mc
->uplink_rule
)
686 mlx5_del_flow_rules(esw_mc
->uplink_rule
);
688 l2addr_hash_del(esw_mc
);
692 /* Apply vport UC/MC list to HW l2 table and FDB table */
693 static void esw_apply_vport_addr_list(struct mlx5_eswitch
*esw
,
694 struct mlx5_vport
*vport
, int list_type
)
696 bool is_uc
= list_type
== MLX5_NVPRT_LIST_TYPE_UC
;
697 vport_addr_action vport_addr_add
;
698 vport_addr_action vport_addr_del
;
699 struct vport_addr
*addr
;
700 struct l2addr_node
*node
;
701 struct hlist_head
*hash
;
702 struct hlist_node
*tmp
;
705 vport_addr_add
= is_uc
? esw_add_uc_addr
:
707 vport_addr_del
= is_uc
? esw_del_uc_addr
:
710 hash
= is_uc
? vport
->uc_list
: vport
->mc_list
;
711 for_each_l2hash_node(node
, tmp
, hash
, hi
) {
712 addr
= container_of(node
, struct vport_addr
, node
);
713 switch (addr
->action
) {
714 case MLX5_ACTION_ADD
:
715 vport_addr_add(esw
, addr
);
716 addr
->action
= MLX5_ACTION_NONE
;
718 case MLX5_ACTION_DEL
:
719 vport_addr_del(esw
, addr
);
720 l2addr_hash_del(addr
);
726 /* Sync vport UC/MC list from vport context */
727 static void esw_update_vport_addr_list(struct mlx5_eswitch
*esw
,
728 struct mlx5_vport
*vport
, int list_type
)
730 bool is_uc
= list_type
== MLX5_NVPRT_LIST_TYPE_UC
;
731 u8 (*mac_list
)[ETH_ALEN
];
732 struct l2addr_node
*node
;
733 struct vport_addr
*addr
;
734 struct hlist_head
*hash
;
735 struct hlist_node
*tmp
;
741 size
= is_uc
? MLX5_MAX_UC_PER_VPORT(esw
->dev
) :
742 MLX5_MAX_MC_PER_VPORT(esw
->dev
);
744 mac_list
= kcalloc(size
, ETH_ALEN
, GFP_KERNEL
);
748 hash
= is_uc
? vport
->uc_list
: vport
->mc_list
;
750 for_each_l2hash_node(node
, tmp
, hash
, hi
) {
751 addr
= container_of(node
, struct vport_addr
, node
);
752 addr
->action
= MLX5_ACTION_DEL
;
758 err
= mlx5_query_nic_vport_mac_list(esw
->dev
, vport
->vport
, list_type
,
762 esw_debug(esw
->dev
, "vport[%d] context update %s list size (%d)\n",
763 vport
->vport
, is_uc
? "UC" : "MC", size
);
765 for (i
= 0; i
< size
; i
++) {
766 if (is_uc
&& !is_valid_ether_addr(mac_list
[i
]))
769 if (!is_uc
&& !is_multicast_ether_addr(mac_list
[i
]))
772 addr
= l2addr_hash_find(hash
, mac_list
[i
], struct vport_addr
);
774 addr
->action
= MLX5_ACTION_NONE
;
		/* If this mac was previously added because of allmulti
		 * promiscuous rx mode, it's now converted to be the original
		 * "real" mac of the vport.
		 */
779 if (addr
->mc_promisc
) {
780 struct esw_mc_addr
*esw_mc
=
781 l2addr_hash_find(esw
->mc_table
,
786 "Failed to MAC(%pM) in mcast DB\n",
791 addr
->mc_promisc
= false;
796 addr
= l2addr_hash_add(hash
, mac_list
[i
], struct vport_addr
,
800 "Failed to add MAC(%pM) to vport[%d] DB\n",
801 mac_list
[i
], vport
->vport
);
804 addr
->vport
= vport
->vport
;
805 addr
->action
= MLX5_ACTION_ADD
;
811 /* Sync vport UC/MC list from vport context
812 * Must be called after esw_update_vport_addr_list
814 static void esw_update_vport_mc_promisc(struct mlx5_eswitch
*esw
,
815 struct mlx5_vport
*vport
)
817 struct l2addr_node
*node
;
818 struct vport_addr
*addr
;
819 struct hlist_head
*hash
;
820 struct hlist_node
*tmp
;
823 hash
= vport
->mc_list
;
825 for_each_l2hash_node(node
, tmp
, esw
->mc_table
, hi
) {
826 u8
*mac
= node
->addr
;
828 addr
= l2addr_hash_find(hash
, mac
, struct vport_addr
);
830 if (addr
->action
== MLX5_ACTION_DEL
)
831 addr
->action
= MLX5_ACTION_NONE
;
834 addr
= l2addr_hash_add(hash
, mac
, struct vport_addr
,
838 "Failed to add allmulti MAC(%pM) to vport[%d] DB\n",
842 addr
->vport
= vport
->vport
;
843 addr
->action
= MLX5_ACTION_ADD
;
844 addr
->mc_promisc
= true;
848 /* Apply vport rx mode to HW FDB table */
849 static void esw_apply_vport_rx_mode(struct mlx5_eswitch
*esw
,
850 struct mlx5_vport
*vport
,
851 bool promisc
, bool mc_promisc
)
853 struct esw_mc_addr
*allmulti_addr
= &esw
->mc_promisc
;
855 if (IS_ERR_OR_NULL(vport
->allmulti_rule
) != mc_promisc
)
859 vport
->allmulti_rule
=
860 esw_fdb_set_vport_allmulti_rule(esw
, vport
->vport
);
861 if (!allmulti_addr
->uplink_rule
)
862 allmulti_addr
->uplink_rule
=
863 esw_fdb_set_vport_allmulti_rule(esw
,
865 allmulti_addr
->refcnt
++;
866 } else if (vport
->allmulti_rule
) {
867 mlx5_del_flow_rules(vport
->allmulti_rule
);
868 vport
->allmulti_rule
= NULL
;
870 if (--allmulti_addr
->refcnt
> 0)
873 if (allmulti_addr
->uplink_rule
)
874 mlx5_del_flow_rules(allmulti_addr
->uplink_rule
);
875 allmulti_addr
->uplink_rule
= NULL
;
879 if (IS_ERR_OR_NULL(vport
->promisc_rule
) != promisc
)
883 vport
->promisc_rule
=
884 esw_fdb_set_vport_promisc_rule(esw
, vport
->vport
);
885 } else if (vport
->promisc_rule
) {
886 mlx5_del_flow_rules(vport
->promisc_rule
);
887 vport
->promisc_rule
= NULL
;
891 /* Sync vport rx mode from vport context */
892 static void esw_update_vport_rx_mode(struct mlx5_eswitch
*esw
,
893 struct mlx5_vport
*vport
)
900 err
= mlx5_query_nic_vport_promisc(esw
->dev
,
907 esw_debug(esw
->dev
, "vport[%d] context update rx mode promisc_all=%d, all_multi=%d\n",
908 vport
->vport
, promisc_all
, promisc_mc
);
910 if (!vport
->info
.trusted
|| !vport
->enabled
) {
916 esw_apply_vport_rx_mode(esw
, vport
, promisc_all
,
917 (promisc_all
|| promisc_mc
));
920 static void esw_vport_change_handle_locked(struct mlx5_vport
*vport
)
922 struct mlx5_core_dev
*dev
= vport
->dev
;
923 struct mlx5_eswitch
*esw
= dev
->priv
.eswitch
;
926 mlx5_query_nic_vport_mac_address(dev
, vport
->vport
, true, mac
);
927 esw_debug(dev
, "vport[%d] Context Changed: perm mac: %pM\n",
930 if (vport
->enabled_events
& MLX5_VPORT_UC_ADDR_CHANGE
) {
931 esw_update_vport_addr_list(esw
, vport
, MLX5_NVPRT_LIST_TYPE_UC
);
932 esw_apply_vport_addr_list(esw
, vport
, MLX5_NVPRT_LIST_TYPE_UC
);
935 if (vport
->enabled_events
& MLX5_VPORT_MC_ADDR_CHANGE
)
936 esw_update_vport_addr_list(esw
, vport
, MLX5_NVPRT_LIST_TYPE_MC
);
938 if (vport
->enabled_events
& MLX5_VPORT_PROMISC_CHANGE
) {
939 esw_update_vport_rx_mode(esw
, vport
);
940 if (!IS_ERR_OR_NULL(vport
->allmulti_rule
))
941 esw_update_vport_mc_promisc(esw
, vport
);
944 if (vport
->enabled_events
& (MLX5_VPORT_PROMISC_CHANGE
| MLX5_VPORT_MC_ADDR_CHANGE
))
945 esw_apply_vport_addr_list(esw
, vport
, MLX5_NVPRT_LIST_TYPE_MC
);
947 esw_debug(esw
->dev
, "vport[%d] Context Changed: Done\n", vport
->vport
);
949 arm_vport_context_events_cmd(dev
, vport
->vport
,
950 vport
->enabled_events
);
953 static void esw_vport_change_handler(struct work_struct
*work
)
955 struct mlx5_vport
*vport
=
956 container_of(work
, struct mlx5_vport
, vport_change_handler
);
957 struct mlx5_eswitch
*esw
= vport
->dev
->priv
.eswitch
;
959 mutex_lock(&esw
->state_lock
);
960 esw_vport_change_handle_locked(vport
);
961 mutex_unlock(&esw
->state_lock
);
964 static bool element_type_supported(struct mlx5_eswitch
*esw
, int type
)
966 const struct mlx5_core_dev
*dev
= esw
->dev
;
969 case SCHEDULING_CONTEXT_ELEMENT_TYPE_TSAR
:
970 return MLX5_CAP_QOS(dev
, esw_element_type
) &
971 ELEMENT_TYPE_CAP_MASK_TASR
;
972 case SCHEDULING_CONTEXT_ELEMENT_TYPE_VPORT
:
973 return MLX5_CAP_QOS(dev
, esw_element_type
) &
974 ELEMENT_TYPE_CAP_MASK_VPORT
;
975 case SCHEDULING_CONTEXT_ELEMENT_TYPE_VPORT_TC
:
976 return MLX5_CAP_QOS(dev
, esw_element_type
) &
977 ELEMENT_TYPE_CAP_MASK_VPORT_TC
;
978 case SCHEDULING_CONTEXT_ELEMENT_TYPE_PARA_VPORT_TC
:
979 return MLX5_CAP_QOS(dev
, esw_element_type
) &
980 ELEMENT_TYPE_CAP_MASK_PARA_VPORT_TC
;
985 /* Vport QoS management */
986 static void esw_create_tsar(struct mlx5_eswitch
*esw
)
988 u32 tsar_ctx
[MLX5_ST_SZ_DW(scheduling_context
)] = {0};
989 struct mlx5_core_dev
*dev
= esw
->dev
;
993 if (!MLX5_CAP_GEN(dev
, qos
) || !MLX5_CAP_QOS(dev
, esw_scheduling
))
996 if (!element_type_supported(esw
, SCHEDULING_CONTEXT_ELEMENT_TYPE_TSAR
))
999 if (esw
->qos
.enabled
)
1002 MLX5_SET(scheduling_context
, tsar_ctx
, element_type
,
1003 SCHEDULING_CONTEXT_ELEMENT_TYPE_TSAR
);
1005 attr
= MLX5_ADDR_OF(scheduling_context
, tsar_ctx
, element_attributes
);
1006 *attr
= cpu_to_be32(TSAR_ELEMENT_TSAR_TYPE_DWRR
<< 16);
1008 err
= mlx5_create_scheduling_element_cmd(dev
,
1009 SCHEDULING_HIERARCHY_E_SWITCH
,
1011 &esw
->qos
.root_tsar_id
);
1013 esw_warn(esw
->dev
, "E-Switch create TSAR failed (%d)\n", err
);
1017 esw
->qos
.enabled
= true;
1020 static void esw_destroy_tsar(struct mlx5_eswitch
*esw
)
1024 if (!esw
->qos
.enabled
)
1027 err
= mlx5_destroy_scheduling_element_cmd(esw
->dev
,
1028 SCHEDULING_HIERARCHY_E_SWITCH
,
1029 esw
->qos
.root_tsar_id
);
1031 esw_warn(esw
->dev
, "E-Switch destroy TSAR failed (%d)\n", err
);
1033 esw
->qos
.enabled
= false;
1036 static int esw_vport_enable_qos(struct mlx5_eswitch
*esw
,
1037 struct mlx5_vport
*vport
,
1038 u32 initial_max_rate
, u32 initial_bw_share
)
1040 u32 sched_ctx
[MLX5_ST_SZ_DW(scheduling_context
)] = {0};
1041 struct mlx5_core_dev
*dev
= esw
->dev
;
1045 if (!esw
->qos
.enabled
|| !MLX5_CAP_GEN(dev
, qos
) ||
1046 !MLX5_CAP_QOS(dev
, esw_scheduling
))
1049 if (vport
->qos
.enabled
)
1052 MLX5_SET(scheduling_context
, sched_ctx
, element_type
,
1053 SCHEDULING_CONTEXT_ELEMENT_TYPE_VPORT
);
1054 vport_elem
= MLX5_ADDR_OF(scheduling_context
, sched_ctx
,
1055 element_attributes
);
1056 MLX5_SET(vport_element
, vport_elem
, vport_number
, vport
->vport
);
1057 MLX5_SET(scheduling_context
, sched_ctx
, parent_element_id
,
1058 esw
->qos
.root_tsar_id
);
1059 MLX5_SET(scheduling_context
, sched_ctx
, max_average_bw
,
1061 MLX5_SET(scheduling_context
, sched_ctx
, bw_share
, initial_bw_share
);
1063 err
= mlx5_create_scheduling_element_cmd(dev
,
1064 SCHEDULING_HIERARCHY_E_SWITCH
,
1066 &vport
->qos
.esw_tsar_ix
);
1068 esw_warn(esw
->dev
, "E-Switch create TSAR vport element failed (vport=%d,err=%d)\n",
1073 vport
->qos
.enabled
= true;
1077 static void esw_vport_disable_qos(struct mlx5_eswitch
*esw
,
1078 struct mlx5_vport
*vport
)
1082 if (!vport
->qos
.enabled
)
1085 err
= mlx5_destroy_scheduling_element_cmd(esw
->dev
,
1086 SCHEDULING_HIERARCHY_E_SWITCH
,
1087 vport
->qos
.esw_tsar_ix
);
1089 esw_warn(esw
->dev
, "E-Switch destroy TSAR vport element failed (vport=%d,err=%d)\n",
1092 vport
->qos
.enabled
= false;
1095 static int esw_vport_qos_config(struct mlx5_eswitch
*esw
,
1096 struct mlx5_vport
*vport
,
1097 u32 max_rate
, u32 bw_share
)
1099 u32 sched_ctx
[MLX5_ST_SZ_DW(scheduling_context
)] = {0};
1100 struct mlx5_core_dev
*dev
= esw
->dev
;
1105 if (!MLX5_CAP_GEN(dev
, qos
) || !MLX5_CAP_QOS(dev
, esw_scheduling
))
1108 if (!vport
->qos
.enabled
)
1111 MLX5_SET(scheduling_context
, sched_ctx
, element_type
,
1112 SCHEDULING_CONTEXT_ELEMENT_TYPE_VPORT
);
1113 vport_elem
= MLX5_ADDR_OF(scheduling_context
, sched_ctx
,
1114 element_attributes
);
1115 MLX5_SET(vport_element
, vport_elem
, vport_number
, vport
->vport
);
1116 MLX5_SET(scheduling_context
, sched_ctx
, parent_element_id
,
1117 esw
->qos
.root_tsar_id
);
1118 MLX5_SET(scheduling_context
, sched_ctx
, max_average_bw
,
1120 MLX5_SET(scheduling_context
, sched_ctx
, bw_share
, bw_share
);
1121 bitmask
|= MODIFY_SCHEDULING_ELEMENT_IN_MODIFY_BITMASK_MAX_AVERAGE_BW
;
1122 bitmask
|= MODIFY_SCHEDULING_ELEMENT_IN_MODIFY_BITMASK_BW_SHARE
;
1124 err
= mlx5_modify_scheduling_element_cmd(dev
,
1125 SCHEDULING_HIERARCHY_E_SWITCH
,
1127 vport
->qos
.esw_tsar_ix
,
1130 esw_warn(esw
->dev
, "E-Switch modify TSAR vport element failed (vport=%d,err=%d)\n",
1138 int mlx5_esw_modify_vport_rate(struct mlx5_eswitch
*esw
, u16 vport_num
,
1141 u32 ctx
[MLX5_ST_SZ_DW(scheduling_context
)] = {};
1142 struct mlx5_vport
*vport
;
1144 vport
= mlx5_eswitch_get_vport(esw
, vport_num
);
1146 if (!vport
->qos
.enabled
)
1149 MLX5_SET(scheduling_context
, ctx
, max_average_bw
, rate_mbps
);
1151 return mlx5_modify_scheduling_element_cmd(esw
->dev
,
1152 SCHEDULING_HIERARCHY_E_SWITCH
,
1154 vport
->qos
.esw_tsar_ix
,
1155 MODIFY_SCHEDULING_ELEMENT_IN_MODIFY_BITMASK_MAX_AVERAGE_BW
);
static void node_guid_gen_from_mac(u64 *node_guid, const u8 *mac)
{
	((u8 *)node_guid)[7] = mac[0];
	((u8 *)node_guid)[6] = mac[1];
	((u8 *)node_guid)[5] = mac[2];
	((u8 *)node_guid)[4] = 0xff;
	((u8 *)node_guid)[3] = 0xfe;
	((u8 *)node_guid)[2] = mac[3];
	((u8 *)node_guid)[1] = mac[4];
	((u8 *)node_guid)[0] = mac[5];
}
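/* Example: MAC 00:11:22:33:44:55 maps to the EUI-64 style node GUID
 * 00:11:22:ff:fe:33:44:55 (ff:fe inserted between the OUI and the NIC-specific
 * halves of the MAC).
 */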
1170 static int esw_vport_create_legacy_acl_tables(struct mlx5_eswitch
*esw
,
1171 struct mlx5_vport
*vport
)
1175 /* Only non manager vports need ACL in legacy mode */
1176 if (mlx5_esw_is_manager_vport(esw
, vport
->vport
))
1179 ret
= esw_acl_ingress_lgcy_setup(esw
, vport
);
1183 ret
= esw_acl_egress_lgcy_setup(esw
, vport
);
1190 esw_acl_ingress_lgcy_cleanup(esw
, vport
);
1195 static int esw_vport_setup_acl(struct mlx5_eswitch
*esw
,
1196 struct mlx5_vport
*vport
)
1198 if (esw
->mode
== MLX5_ESWITCH_LEGACY
)
1199 return esw_vport_create_legacy_acl_tables(esw
, vport
);
1201 return esw_vport_create_offloads_acl_tables(esw
, vport
);
1204 static void esw_vport_destroy_legacy_acl_tables(struct mlx5_eswitch
*esw
,
1205 struct mlx5_vport
*vport
)
1208 if (mlx5_esw_is_manager_vport(esw
, vport
->vport
))
1211 esw_acl_egress_lgcy_cleanup(esw
, vport
);
1212 esw_acl_ingress_lgcy_cleanup(esw
, vport
);
1215 static void esw_vport_cleanup_acl(struct mlx5_eswitch
*esw
,
1216 struct mlx5_vport
*vport
)
1218 if (esw
->mode
== MLX5_ESWITCH_LEGACY
)
1219 esw_vport_destroy_legacy_acl_tables(esw
, vport
);
1221 esw_vport_destroy_offloads_acl_tables(esw
, vport
);
1224 static int esw_vport_setup(struct mlx5_eswitch
*esw
, struct mlx5_vport
*vport
)
1226 u16 vport_num
= vport
->vport
;
1230 err
= esw_vport_setup_acl(esw
, vport
);
1234 /* Attach vport to the eswitch rate limiter */
1235 esw_vport_enable_qos(esw
, vport
, vport
->info
.max_rate
, vport
->qos
.bw_share
);
1237 if (mlx5_esw_is_manager_vport(esw
, vport_num
))
1240 mlx5_modify_vport_admin_state(esw
->dev
,
1241 MLX5_VPORT_STATE_OP_MOD_ESW_VPORT
,
1243 vport
->info
.link_state
);
1245 /* Host PF has its own mac/guid. */
1247 mlx5_modify_nic_vport_mac_address(esw
->dev
, vport_num
,
1249 mlx5_modify_nic_vport_node_guid(esw
->dev
, vport_num
,
1250 vport
->info
.node_guid
);
1253 flags
= (vport
->info
.vlan
|| vport
->info
.qos
) ?
1254 SET_VLAN_STRIP
| SET_VLAN_INSERT
: 0;
1255 modify_esw_vport_cvlan(esw
->dev
, vport_num
, vport
->info
.vlan
,
1256 vport
->info
.qos
, flags
);
1261 /* Don't cleanup vport->info, it's needed to restore vport configuration */
1262 static void esw_vport_cleanup(struct mlx5_eswitch
*esw
, struct mlx5_vport
*vport
)
1264 u16 vport_num
= vport
->vport
;
1266 if (!mlx5_esw_is_manager_vport(esw
, vport_num
))
1267 mlx5_modify_vport_admin_state(esw
->dev
,
1268 MLX5_VPORT_STATE_OP_MOD_ESW_VPORT
,
1270 MLX5_VPORT_ADMIN_STATE_DOWN
);
1272 esw_vport_disable_qos(esw
, vport
);
1273 esw_vport_cleanup_acl(esw
, vport
);
1276 static int esw_enable_vport(struct mlx5_eswitch
*esw
, u16 vport_num
,
1277 enum mlx5_eswitch_vport_event enabled_events
)
1279 struct mlx5_vport
*vport
;
1282 vport
= mlx5_eswitch_get_vport(esw
, vport_num
);
1284 mutex_lock(&esw
->state_lock
);
1285 WARN_ON(vport
->enabled
);
1287 esw_debug(esw
->dev
, "Enabling VPORT(%d)\n", vport_num
);
1289 ret
= esw_vport_setup(esw
, vport
);
1293 /* Sync with current vport context */
1294 vport
->enabled_events
= enabled_events
;
1295 vport
->enabled
= true;
1297 /* Esw manager is trusted by default. Host PF (vport 0) is trusted as well
1298 * in smartNIC as it's a vport group manager.
1300 if (mlx5_esw_is_manager_vport(esw
, vport_num
) ||
1301 (!vport_num
&& mlx5_core_is_ecpf(esw
->dev
)))
1302 vport
->info
.trusted
= true;
1304 esw_vport_change_handle_locked(vport
);
1306 esw
->enabled_vports
++;
1307 esw_debug(esw
->dev
, "Enabled VPORT(%d)\n", vport_num
);
1309 mutex_unlock(&esw
->state_lock
);
1313 static void esw_disable_vport(struct mlx5_eswitch
*esw
, u16 vport_num
)
1315 struct mlx5_vport
*vport
;
1317 vport
= mlx5_eswitch_get_vport(esw
, vport_num
);
1319 mutex_lock(&esw
->state_lock
);
1320 if (!vport
->enabled
)
1323 esw_debug(esw
->dev
, "Disabling vport(%d)\n", vport_num
);
1324 /* Mark this vport as disabled to discard new events */
1325 vport
->enabled
= false;
1327 /* Disable events from this vport */
1328 arm_vport_context_events_cmd(esw
->dev
, vport
->vport
, 0);
1329 /* We don't assume VFs will cleanup after themselves.
1330 * Calling vport change handler while vport is disabled will cleanup
1331 * the vport resources.
1333 esw_vport_change_handle_locked(vport
);
1334 vport
->enabled_events
= 0;
1335 esw_vport_cleanup(esw
, vport
);
1336 esw
->enabled_vports
--;
1339 mutex_unlock(&esw
->state_lock
);
1342 static int eswitch_vport_event(struct notifier_block
*nb
,
1343 unsigned long type
, void *data
)
1345 struct mlx5_eswitch
*esw
= mlx5_nb_cof(nb
, struct mlx5_eswitch
, nb
);
1346 struct mlx5_eqe
*eqe
= data
;
1347 struct mlx5_vport
*vport
;
1350 vport_num
= be16_to_cpu(eqe
->data
.vport_change
.vport_num
);
1351 vport
= mlx5_eswitch_get_vport(esw
, vport_num
);
1353 queue_work(esw
->work_queue
, &vport
->vport_change_handler
);
/**
 * mlx5_esw_query_functions - Returns raw output about functions state
 * @dev: Pointer to device to query
 *
 * mlx5_esw_query_functions() allocates and returns functions changed
 * raw output memory pointer from device on success. Otherwise returns ERR_PTR.
 * Caller must free the memory using kvfree() when valid pointer is returned.
 */
1365 const u32
*mlx5_esw_query_functions(struct mlx5_core_dev
*dev
)
1367 int outlen
= MLX5_ST_SZ_BYTES(query_esw_functions_out
);
1368 u32 in
[MLX5_ST_SZ_DW(query_esw_functions_in
)] = {};
1372 out
= kvzalloc(outlen
, GFP_KERNEL
);
1374 return ERR_PTR(-ENOMEM
);
1376 MLX5_SET(query_esw_functions_in
, in
, opcode
,
1377 MLX5_CMD_OP_QUERY_ESW_FUNCTIONS
);
1379 err
= mlx5_cmd_exec_inout(dev
, query_esw_functions
, in
, out
);
1384 return ERR_PTR(err
);
1387 static void mlx5_eswitch_event_handlers_register(struct mlx5_eswitch
*esw
)
1389 MLX5_NB_INIT(&esw
->nb
, eswitch_vport_event
, NIC_VPORT_CHANGE
);
1390 mlx5_eq_notifier_register(esw
->dev
, &esw
->nb
);
1392 if (esw
->mode
== MLX5_ESWITCH_OFFLOADS
&& mlx5_eswitch_is_funcs_handler(esw
->dev
)) {
1393 MLX5_NB_INIT(&esw
->esw_funcs
.nb
, mlx5_esw_funcs_changed_handler
,
1394 ESW_FUNCTIONS_CHANGED
);
1395 mlx5_eq_notifier_register(esw
->dev
, &esw
->esw_funcs
.nb
);
1399 static void mlx5_eswitch_event_handlers_unregister(struct mlx5_eswitch
*esw
)
1401 if (esw
->mode
== MLX5_ESWITCH_OFFLOADS
&& mlx5_eswitch_is_funcs_handler(esw
->dev
))
1402 mlx5_eq_notifier_unregister(esw
->dev
, &esw
->esw_funcs
.nb
);
1404 mlx5_eq_notifier_unregister(esw
->dev
, &esw
->nb
);
1406 flush_workqueue(esw
->work_queue
);
1409 static void mlx5_eswitch_clear_vf_vports_info(struct mlx5_eswitch
*esw
)
1411 struct mlx5_vport
*vport
;
1414 mlx5_esw_for_each_vf_vport(esw
, i
, vport
, esw
->esw_funcs
.num_vfs
) {
1415 memset(&vport
->qos
, 0, sizeof(vport
->qos
));
1416 memset(&vport
->info
, 0, sizeof(vport
->info
));
1417 vport
->info
.link_state
= MLX5_VPORT_ADMIN_STATE_AUTO
;
/* Public E-Switch API */
#define ESW_ALLOWED(esw) ((esw) && MLX5_ESWITCH_MANAGER((esw)->dev))
1424 int mlx5_eswitch_load_vport(struct mlx5_eswitch
*esw
, u16 vport_num
,
1425 enum mlx5_eswitch_vport_event enabled_events
)
1429 err
= esw_enable_vport(esw
, vport_num
, enabled_events
);
1433 err
= esw_offloads_load_rep(esw
, vport_num
);
1440 esw_disable_vport(esw
, vport_num
);
1444 void mlx5_eswitch_unload_vport(struct mlx5_eswitch
*esw
, u16 vport_num
)
1446 esw_offloads_unload_rep(esw
, vport_num
);
1447 esw_disable_vport(esw
, vport_num
);
1450 void mlx5_eswitch_unload_vf_vports(struct mlx5_eswitch
*esw
, u16 num_vfs
)
1454 mlx5_esw_for_each_vf_vport_num_reverse(esw
, i
, num_vfs
)
1455 mlx5_eswitch_unload_vport(esw
, i
);
1458 int mlx5_eswitch_load_vf_vports(struct mlx5_eswitch
*esw
, u16 num_vfs
,
1459 enum mlx5_eswitch_vport_event enabled_events
)
1464 mlx5_esw_for_each_vf_vport_num(esw
, i
, num_vfs
) {
1465 err
= mlx5_eswitch_load_vport(esw
, i
, enabled_events
);
1473 mlx5_eswitch_unload_vf_vports(esw
, i
- 1);
1477 static int host_pf_enable_hca(struct mlx5_core_dev
*dev
)
1479 if (!mlx5_core_is_ecpf(dev
))
	/* Once vport and representor are ready, take the external host PF
	 * out of initializing state. Enabling HCA clears the iser->initializing
	 * bit and host PF driver loading can progress.
	 */
1486 return mlx5_cmd_host_pf_enable_hca(dev
);
1489 static void host_pf_disable_hca(struct mlx5_core_dev
*dev
)
1491 if (!mlx5_core_is_ecpf(dev
))
1494 mlx5_cmd_host_pf_disable_hca(dev
);
1497 /* mlx5_eswitch_enable_pf_vf_vports() enables vports of PF, ECPF and VFs
1498 * whichever are present on the eswitch.
1501 mlx5_eswitch_enable_pf_vf_vports(struct mlx5_eswitch
*esw
,
1502 enum mlx5_eswitch_vport_event enabled_events
)
1506 /* Enable PF vport */
1507 ret
= mlx5_eswitch_load_vport(esw
, MLX5_VPORT_PF
, enabled_events
);
1511 /* Enable external host PF HCA */
1512 ret
= host_pf_enable_hca(esw
->dev
);
1516 /* Enable ECPF vport */
1517 if (mlx5_ecpf_vport_exists(esw
->dev
)) {
1518 ret
= mlx5_eswitch_load_vport(esw
, MLX5_VPORT_ECPF
, enabled_events
);
1523 /* Enable VF vports */
1524 ret
= mlx5_eswitch_load_vf_vports(esw
, esw
->esw_funcs
.num_vfs
,
1531 if (mlx5_ecpf_vport_exists(esw
->dev
))
1532 mlx5_eswitch_unload_vport(esw
, MLX5_VPORT_ECPF
);
1534 host_pf_disable_hca(esw
->dev
);
1536 mlx5_eswitch_unload_vport(esw
, MLX5_VPORT_PF
);
1540 /* mlx5_eswitch_disable_pf_vf_vports() disables vports of PF, ECPF and VFs
1541 * whichever are previously enabled on the eswitch.
1543 void mlx5_eswitch_disable_pf_vf_vports(struct mlx5_eswitch
*esw
)
1545 mlx5_eswitch_unload_vf_vports(esw
, esw
->esw_funcs
.num_vfs
);
1547 if (mlx5_ecpf_vport_exists(esw
->dev
))
1548 mlx5_eswitch_unload_vport(esw
, MLX5_VPORT_ECPF
);
1550 host_pf_disable_hca(esw
->dev
);
1551 mlx5_eswitch_unload_vport(esw
, MLX5_VPORT_PF
);
1554 static void mlx5_eswitch_get_devlink_param(struct mlx5_eswitch
*esw
)
1556 struct devlink
*devlink
= priv_to_devlink(esw
->dev
);
1557 union devlink_param_value val
;
1560 err
= devlink_param_driverinit_value_get(devlink
,
1561 MLX5_DEVLINK_PARAM_ID_ESW_LARGE_GROUP_NUM
,
1564 esw
->params
.large_group_num
= val
.vu32
;
1567 "Devlink can't get param fdb_large_groups, uses default (%d).\n",
1568 ESW_OFFLOADS_DEFAULT_NUM_GROUPS
);
1569 esw
->params
.large_group_num
= ESW_OFFLOADS_DEFAULT_NUM_GROUPS
;
1574 mlx5_eswitch_update_num_of_vfs(struct mlx5_eswitch
*esw
, int num_vfs
)
1578 WARN_ON_ONCE(esw
->mode
!= MLX5_ESWITCH_NONE
);
1583 if (!mlx5_core_is_ecpf_esw_manager(esw
->dev
)) {
1584 esw
->esw_funcs
.num_vfs
= num_vfs
;
1588 out
= mlx5_esw_query_functions(esw
->dev
);
1592 esw
->esw_funcs
.num_vfs
= MLX5_GET(query_esw_functions_out
, out
,
1593 host_params_context
.host_num_of_vfs
);
/**
 * mlx5_eswitch_enable_locked - Enable eswitch
 * @esw: Pointer to eswitch
 * @mode: Eswitch mode to enable
 * @num_vfs: Enable eswitch for given number of VFs. This is optional.
 *	     Valid values are 0, > 0 and MLX5_ESWITCH_IGNORE_NUM_VFS.
 *	     Caller should pass num_vfs > 0 when enabling eswitch for
 *	     vf vports. Caller should pass num_vfs = 0, when eswitch
 *	     is enabled without sriov VFs or when caller
 *	     is unaware of the sriov state of the host PF on ECPF based
 *	     eswitch. Caller should pass < 0 when num_vfs should be
 *	     completely ignored. This is typically the case when eswitch
 *	     is enabled without sriov regardless of PF/ECPF system.
 *
 * mlx5_eswitch_enable_locked() enables the eswitch in either legacy or
 * offloads mode. If num_vfs >= 0 is provided, it sets up the VF related
 * eswitch vports. It returns 0 on success or an error code on failure.
 */
1614 int mlx5_eswitch_enable_locked(struct mlx5_eswitch
*esw
, int mode
, int num_vfs
)
1618 lockdep_assert_held(&esw
->mode_lock
);
1620 if (!MLX5_CAP_ESW_FLOWTABLE_FDB(esw
->dev
, ft_support
)) {
1621 esw_warn(esw
->dev
, "FDB is not supported, aborting ...\n");
	if (!MLX5_CAP_ESW_INGRESS_ACL(esw->dev, ft_support))
		esw_warn(esw->dev, "ingress ACL is not supported by FW\n");

	if (!MLX5_CAP_ESW_EGRESS_ACL(esw->dev, ft_support))
		esw_warn(esw->dev, "egress ACL is not supported by FW\n");
1631 mlx5_eswitch_get_devlink_param(esw
);
1633 mlx5_eswitch_update_num_of_vfs(esw
, num_vfs
);
1635 esw_create_tsar(esw
);
1639 mlx5_lag_update(esw
->dev
);
1641 if (mode
== MLX5_ESWITCH_LEGACY
) {
1642 err
= esw_legacy_enable(esw
);
1644 mlx5_rescan_drivers(esw
->dev
);
1645 err
= esw_offloads_enable(esw
);
1651 mlx5_eswitch_event_handlers_register(esw
);
1653 esw_info(esw
->dev
, "Enable: mode(%s), nvfs(%d), active vports(%d)\n",
1654 mode
== MLX5_ESWITCH_LEGACY
? "LEGACY" : "OFFLOADS",
1655 esw
->esw_funcs
.num_vfs
, esw
->enabled_vports
);
1660 esw
->mode
= MLX5_ESWITCH_NONE
;
1662 if (mode
== MLX5_ESWITCH_OFFLOADS
)
1663 mlx5_rescan_drivers(esw
->dev
);
1665 esw_destroy_tsar(esw
);
/**
 * mlx5_eswitch_enable - Enable eswitch
 * @esw: Pointer to eswitch
 * @num_vfs: Enable eswitch for given number of VFs.
 *	     Caller must pass num_vfs > 0 when enabling eswitch for
 *	     vf vports.
 *
 * mlx5_eswitch_enable() returns 0 on success or error code on failure.
 */
1677 int mlx5_eswitch_enable(struct mlx5_eswitch
*esw
, int num_vfs
)
1681 if (!ESW_ALLOWED(esw
))
1684 mutex_lock(&esw
->mode_lock
);
1685 if (esw
->mode
== MLX5_ESWITCH_NONE
) {
1686 ret
= mlx5_eswitch_enable_locked(esw
, MLX5_ESWITCH_LEGACY
, num_vfs
);
1688 enum mlx5_eswitch_vport_event vport_events
;
1690 vport_events
= (esw
->mode
== MLX5_ESWITCH_LEGACY
) ?
1691 MLX5_LEGACY_SRIOV_VPORT_EVENTS
: MLX5_VPORT_UC_ADDR_CHANGE
;
1692 ret
= mlx5_eswitch_load_vf_vports(esw
, num_vfs
, vport_events
);
1694 esw
->esw_funcs
.num_vfs
= num_vfs
;
1696 mutex_unlock(&esw
->mode_lock
);
1700 void mlx5_eswitch_disable_locked(struct mlx5_eswitch
*esw
, bool clear_vf
)
1704 lockdep_assert_held_write(&esw
->mode_lock
);
1706 if (esw
->mode
== MLX5_ESWITCH_NONE
)
1709 esw_info(esw
->dev
, "Disable: mode(%s), nvfs(%d), active vports(%d)\n",
1710 esw
->mode
== MLX5_ESWITCH_LEGACY
? "LEGACY" : "OFFLOADS",
1711 esw
->esw_funcs
.num_vfs
, esw
->enabled_vports
);
1713 mlx5_eswitch_event_handlers_unregister(esw
);
1715 if (esw
->mode
== MLX5_ESWITCH_LEGACY
)
1716 esw_legacy_disable(esw
);
1717 else if (esw
->mode
== MLX5_ESWITCH_OFFLOADS
)
1718 esw_offloads_disable(esw
);
1720 old_mode
= esw
->mode
;
1721 esw
->mode
= MLX5_ESWITCH_NONE
;
1723 mlx5_lag_update(esw
->dev
);
1725 if (old_mode
== MLX5_ESWITCH_OFFLOADS
)
1726 mlx5_rescan_drivers(esw
->dev
);
1728 esw_destroy_tsar(esw
);
1731 mlx5_eswitch_clear_vf_vports_info(esw
);
1734 void mlx5_eswitch_disable(struct mlx5_eswitch
*esw
, bool clear_vf
)
1736 if (!ESW_ALLOWED(esw
))
1739 mutex_lock(&esw
->mode_lock
);
1740 mlx5_eswitch_disable_locked(esw
, clear_vf
);
1741 esw
->esw_funcs
.num_vfs
= 0;
1742 mutex_unlock(&esw
->mode_lock
);
1745 int mlx5_eswitch_init(struct mlx5_core_dev
*dev
)
1747 struct mlx5_eswitch
*esw
;
1748 struct mlx5_vport
*vport
;
1752 if (!MLX5_VPORT_MANAGER(dev
))
1755 total_vports
= mlx5_eswitch_get_total_vports(dev
);
1758 "Total vports %d, per vport: max uc(%d) max mc(%d)\n",
1760 MLX5_MAX_UC_PER_VPORT(dev
),
1761 MLX5_MAX_MC_PER_VPORT(dev
));
1763 esw
= kzalloc(sizeof(*esw
), GFP_KERNEL
);
1768 esw
->manager_vport
= mlx5_eswitch_manager_vport(dev
);
1769 esw
->first_host_vport
= mlx5_eswitch_first_host_vport_num(dev
);
1771 esw
->work_queue
= create_singlethread_workqueue("mlx5_esw_wq");
1772 if (!esw
->work_queue
) {
1777 esw
->vports
= kcalloc(total_vports
, sizeof(struct mlx5_vport
),
1784 esw
->total_vports
= total_vports
;
1786 err
= esw_offloads_init_reps(esw
);
1790 mutex_init(&esw
->offloads
.encap_tbl_lock
);
1791 hash_init(esw
->offloads
.encap_tbl
);
1792 mutex_init(&esw
->offloads
.decap_tbl_lock
);
1793 hash_init(esw
->offloads
.decap_tbl
);
1794 mlx5e_mod_hdr_tbl_init(&esw
->offloads
.mod_hdr
);
1795 atomic64_set(&esw
->offloads
.num_flows
, 0);
1796 ida_init(&esw
->offloads
.vport_metadata_ida
);
1797 mutex_init(&esw
->state_lock
);
1798 mutex_init(&esw
->mode_lock
);
1800 mlx5_esw_for_all_vports(esw
, i
, vport
) {
1801 vport
->vport
= mlx5_eswitch_index_to_vport_num(esw
, i
);
1802 vport
->info
.link_state
= MLX5_VPORT_ADMIN_STATE_AUTO
;
1804 INIT_WORK(&vport
->vport_change_handler
,
1805 esw_vport_change_handler
);
1808 esw
->enabled_vports
= 0;
1809 esw
->mode
= MLX5_ESWITCH_NONE
;
1810 esw
->offloads
.inline_mode
= MLX5_INLINE_MODE_NONE
;
1812 dev
->priv
.eswitch
= esw
;
1815 if (esw
->work_queue
)
1816 destroy_workqueue(esw
->work_queue
);
1817 esw_offloads_cleanup_reps(esw
);
1823 void mlx5_eswitch_cleanup(struct mlx5_eswitch
*esw
)
1825 if (!esw
|| !MLX5_VPORT_MANAGER(esw
->dev
))
1828 esw_info(esw
->dev
, "cleanup\n");
1830 esw
->dev
->priv
.eswitch
= NULL
;
1831 destroy_workqueue(esw
->work_queue
);
1832 esw_offloads_cleanup_reps(esw
);
1833 mutex_destroy(&esw
->mode_lock
);
1834 mutex_destroy(&esw
->state_lock
);
1835 ida_destroy(&esw
->offloads
.vport_metadata_ida
);
1836 mlx5e_mod_hdr_tbl_destroy(&esw
->offloads
.mod_hdr
);
1837 mutex_destroy(&esw
->offloads
.encap_tbl_lock
);
1838 mutex_destroy(&esw
->offloads
.decap_tbl_lock
);
1843 /* Vport Administration */
1845 mlx5_esw_set_vport_mac_locked(struct mlx5_eswitch
*esw
,
1846 struct mlx5_vport
*evport
, const u8
*mac
)
1848 u16 vport_num
= evport
->vport
;
1852 if (is_multicast_ether_addr(mac
))
1855 if (evport
->info
.spoofchk
&& !is_valid_ether_addr(mac
))
1856 mlx5_core_warn(esw
->dev
,
1857 "Set invalid MAC while spoofchk is on, vport(%d)\n",
1860 err
= mlx5_modify_nic_vport_mac_address(esw
->dev
, vport_num
, mac
);
1862 mlx5_core_warn(esw
->dev
,
1863 "Failed to mlx5_modify_nic_vport_mac vport(%d) err=(%d)\n",
1868 node_guid_gen_from_mac(&node_guid
, mac
);
1869 err
= mlx5_modify_nic_vport_node_guid(esw
->dev
, vport_num
, node_guid
);
1871 mlx5_core_warn(esw
->dev
,
1872 "Failed to set vport %d node guid, err = %d. RDMA_CM will not function properly for this VF.\n",
1875 ether_addr_copy(evport
->info
.mac
, mac
);
1876 evport
->info
.node_guid
= node_guid
;
1877 if (evport
->enabled
&& esw
->mode
== MLX5_ESWITCH_LEGACY
)
1878 err
= esw_acl_ingress_lgcy_setup(esw
, evport
);
1883 int mlx5_eswitch_set_vport_mac(struct mlx5_eswitch
*esw
,
1884 u16 vport
, const u8
*mac
)
1886 struct mlx5_vport
*evport
= mlx5_eswitch_get_vport(esw
, vport
);
1890 return PTR_ERR(evport
);
1892 mutex_lock(&esw
->state_lock
);
1893 err
= mlx5_esw_set_vport_mac_locked(esw
, evport
, mac
);
1894 mutex_unlock(&esw
->state_lock
);
1899 is_port_function_supported(const struct mlx5_eswitch
*esw
, u16 vport_num
)
1901 return vport_num
== MLX5_VPORT_PF
||
1902 mlx5_eswitch_is_vf_vport(esw
, vport_num
);
1905 int mlx5_devlink_port_function_hw_addr_get(struct devlink
*devlink
,
1906 struct devlink_port
*port
,
1907 u8
*hw_addr
, int *hw_addr_len
,
1908 struct netlink_ext_ack
*extack
)
1910 struct mlx5_eswitch
*esw
;
1911 struct mlx5_vport
*vport
;
1912 int err
= -EOPNOTSUPP
;
1915 esw
= mlx5_devlink_eswitch_get(devlink
);
1917 return PTR_ERR(esw
);
1919 vport_num
= mlx5_esw_devlink_port_index_to_vport_num(port
->index
);
1920 if (!is_port_function_supported(esw
, vport_num
))
1923 vport
= mlx5_eswitch_get_vport(esw
, vport_num
);
1924 if (IS_ERR(vport
)) {
1925 NL_SET_ERR_MSG_MOD(extack
, "Invalid port");
1926 return PTR_ERR(vport
);
1929 mutex_lock(&esw
->state_lock
);
1930 if (vport
->enabled
) {
1931 ether_addr_copy(hw_addr
, vport
->info
.mac
);
1932 *hw_addr_len
= ETH_ALEN
;
1935 mutex_unlock(&esw
->state_lock
);
1939 int mlx5_devlink_port_function_hw_addr_set(struct devlink
*devlink
,
1940 struct devlink_port
*port
,
1941 const u8
*hw_addr
, int hw_addr_len
,
1942 struct netlink_ext_ack
*extack
)
1944 struct mlx5_eswitch
*esw
;
1945 struct mlx5_vport
*vport
;
1946 int err
= -EOPNOTSUPP
;
1949 esw
= mlx5_devlink_eswitch_get(devlink
);
1951 NL_SET_ERR_MSG_MOD(extack
, "Eswitch doesn't support set hw_addr");
1952 return PTR_ERR(esw
);
1955 vport_num
= mlx5_esw_devlink_port_index_to_vport_num(port
->index
);
1956 if (!is_port_function_supported(esw
, vport_num
)) {
1957 NL_SET_ERR_MSG_MOD(extack
, "Port doesn't support set hw_addr");
1960 vport
= mlx5_eswitch_get_vport(esw
, vport_num
);
1961 if (IS_ERR(vport
)) {
1962 NL_SET_ERR_MSG_MOD(extack
, "Invalid port");
1963 return PTR_ERR(vport
);
1966 mutex_lock(&esw
->state_lock
);
1968 err
= mlx5_esw_set_vport_mac_locked(esw
, vport
, hw_addr
);
1970 NL_SET_ERR_MSG_MOD(extack
, "Eswitch vport is disabled");
1971 mutex_unlock(&esw
->state_lock
);
1975 int mlx5_eswitch_set_vport_state(struct mlx5_eswitch
*esw
,
1976 u16 vport
, int link_state
)
1978 struct mlx5_vport
*evport
= mlx5_eswitch_get_vport(esw
, vport
);
1979 int opmod
= MLX5_VPORT_STATE_OP_MOD_ESW_VPORT
;
1980 int other_vport
= 1;
1983 if (!ESW_ALLOWED(esw
))
1986 return PTR_ERR(evport
);
1988 if (vport
== MLX5_VPORT_UPLINK
) {
1989 opmod
= MLX5_VPORT_STATE_OP_MOD_UPLINK
;
1993 mutex_lock(&esw
->state_lock
);
1995 err
= mlx5_modify_vport_admin_state(esw
->dev
, opmod
, vport
, other_vport
, link_state
);
1997 mlx5_core_warn(esw
->dev
, "Failed to set vport %d link state, opmod = %d, err = %d",
2002 evport
->info
.link_state
= link_state
;
2005 mutex_unlock(&esw
->state_lock
);
2009 int mlx5_eswitch_get_vport_config(struct mlx5_eswitch
*esw
,
2010 u16 vport
, struct ifla_vf_info
*ivi
)
2012 struct mlx5_vport
*evport
= mlx5_eswitch_get_vport(esw
, vport
);
2015 return PTR_ERR(evport
);
2017 memset(ivi
, 0, sizeof(*ivi
));
2018 ivi
->vf
= vport
- 1;
2020 mutex_lock(&esw
->state_lock
);
2021 ether_addr_copy(ivi
->mac
, evport
->info
.mac
);
2022 ivi
->linkstate
= evport
->info
.link_state
;
2023 ivi
->vlan
= evport
->info
.vlan
;
2024 ivi
->qos
= evport
->info
.qos
;
2025 ivi
->spoofchk
= evport
->info
.spoofchk
;
2026 ivi
->trusted
= evport
->info
.trusted
;
2027 ivi
->min_tx_rate
= evport
->info
.min_rate
;
2028 ivi
->max_tx_rate
= evport
->info
.max_rate
;
2029 mutex_unlock(&esw
->state_lock
);
2034 int __mlx5_eswitch_set_vport_vlan(struct mlx5_eswitch
*esw
,
2035 u16 vport
, u16 vlan
, u8 qos
, u8 set_flags
)
2037 struct mlx5_vport
*evport
= mlx5_eswitch_get_vport(esw
, vport
);
2041 return PTR_ERR(evport
);
2042 if (vlan
> 4095 || qos
> 7)
2045 err
= modify_esw_vport_cvlan(esw
->dev
, vport
, vlan
, qos
, set_flags
);
2049 evport
->info
.vlan
= vlan
;
2050 evport
->info
.qos
= qos
;
2051 if (evport
->enabled
&& esw
->mode
== MLX5_ESWITCH_LEGACY
) {
2052 err
= esw_acl_ingress_lgcy_setup(esw
, evport
);
2055 err
= esw_acl_egress_lgcy_setup(esw
, evport
);
2061 int mlx5_eswitch_set_vport_vlan(struct mlx5_eswitch
*esw
,
2062 u16 vport
, u16 vlan
, u8 qos
)
2067 if (!ESW_ALLOWED(esw
))
2071 set_flags
= SET_VLAN_STRIP
| SET_VLAN_INSERT
;
2073 mutex_lock(&esw
->state_lock
);
2074 err
= __mlx5_eswitch_set_vport_vlan(esw
, vport
, vlan
, qos
, set_flags
);
2075 mutex_unlock(&esw
->state_lock
);
2080 int mlx5_eswitch_set_vport_spoofchk(struct mlx5_eswitch
*esw
,
2081 u16 vport
, bool spoofchk
)
2083 struct mlx5_vport
*evport
= mlx5_eswitch_get_vport(esw
, vport
);
2087 if (!ESW_ALLOWED(esw
))
2090 return PTR_ERR(evport
);
2092 mutex_lock(&esw
->state_lock
);
2093 pschk
= evport
->info
.spoofchk
;
2094 evport
->info
.spoofchk
= spoofchk
;
2095 if (pschk
&& !is_valid_ether_addr(evport
->info
.mac
))
2096 mlx5_core_warn(esw
->dev
,
2097 "Spoofchk in set while MAC is invalid, vport(%d)\n",
2099 if (evport
->enabled
&& esw
->mode
== MLX5_ESWITCH_LEGACY
)
2100 err
= esw_acl_ingress_lgcy_setup(esw
, evport
);
2102 evport
->info
.spoofchk
= pschk
;
2103 mutex_unlock(&esw
->state_lock
);
2108 static void esw_cleanup_vepa_rules(struct mlx5_eswitch
*esw
)
2110 if (esw
->fdb_table
.legacy
.vepa_uplink_rule
)
2111 mlx5_del_flow_rules(esw
->fdb_table
.legacy
.vepa_uplink_rule
);
2113 if (esw
->fdb_table
.legacy
.vepa_star_rule
)
2114 mlx5_del_flow_rules(esw
->fdb_table
.legacy
.vepa_star_rule
);
2116 esw
->fdb_table
.legacy
.vepa_uplink_rule
= NULL
;
2117 esw
->fdb_table
.legacy
.vepa_star_rule
= NULL
;
2120 static int _mlx5_eswitch_set_vepa_locked(struct mlx5_eswitch
*esw
,
2123 struct mlx5_flow_destination dest
= {};
2124 struct mlx5_flow_act flow_act
= {};
2125 struct mlx5_flow_handle
*flow_rule
;
2126 struct mlx5_flow_spec
*spec
;
2131 esw_cleanup_vepa_rules(esw
);
2135 if (esw
->fdb_table
.legacy
.vepa_uplink_rule
)
2138 spec
= kvzalloc(sizeof(*spec
), GFP_KERNEL
);
2142 /* Uplink rule forward uplink traffic to FDB */
2143 misc
= MLX5_ADDR_OF(fte_match_param
, spec
->match_value
, misc_parameters
);
2144 MLX5_SET(fte_match_set_misc
, misc
, source_port
, MLX5_VPORT_UPLINK
);
2146 misc
= MLX5_ADDR_OF(fte_match_param
, spec
->match_criteria
, misc_parameters
);
2147 MLX5_SET_TO_ONES(fte_match_set_misc
, misc
, source_port
);
2149 spec
->match_criteria_enable
= MLX5_MATCH_MISC_PARAMETERS
;
2150 dest
.type
= MLX5_FLOW_DESTINATION_TYPE_FLOW_TABLE
;
2151 dest
.ft
= esw
->fdb_table
.legacy
.fdb
;
2152 flow_act
.action
= MLX5_FLOW_CONTEXT_ACTION_FWD_DEST
;
2153 flow_rule
= mlx5_add_flow_rules(esw
->fdb_table
.legacy
.vepa_fdb
, spec
,
2154 &flow_act
, &dest
, 1);
2155 if (IS_ERR(flow_rule
)) {
2156 err
= PTR_ERR(flow_rule
);
2159 esw
->fdb_table
.legacy
.vepa_uplink_rule
= flow_rule
;
2162 /* Star rule to forward all traffic to uplink vport */
2163 memset(&dest
, 0, sizeof(dest
));
2164 dest
.type
= MLX5_FLOW_DESTINATION_TYPE_VPORT
;
2165 dest
.vport
.num
= MLX5_VPORT_UPLINK
;
2166 flow_act
.action
= MLX5_FLOW_CONTEXT_ACTION_FWD_DEST
;
2167 flow_rule
= mlx5_add_flow_rules(esw
->fdb_table
.legacy
.vepa_fdb
, NULL
,
2168 &flow_act
, &dest
, 1);
2169 if (IS_ERR(flow_rule
)) {
2170 err
= PTR_ERR(flow_rule
);
2173 esw
->fdb_table
.legacy
.vepa_star_rule
= flow_rule
;
2179 esw_cleanup_vepa_rules(esw
);
2183 int mlx5_eswitch_set_vepa(struct mlx5_eswitch
*esw
, u8 setting
)
2190 if (!ESW_ALLOWED(esw
))
2193 mutex_lock(&esw
->state_lock
);
2194 if (esw
->mode
!= MLX5_ESWITCH_LEGACY
) {
2199 err
= _mlx5_eswitch_set_vepa_locked(esw
, setting
);
2202 mutex_unlock(&esw
->state_lock
);
2206 int mlx5_eswitch_get_vepa(struct mlx5_eswitch
*esw
, u8
*setting
)
2211 if (!ESW_ALLOWED(esw
))
2214 if (esw
->mode
!= MLX5_ESWITCH_LEGACY
)
2217 *setting
= esw
->fdb_table
.legacy
.vepa_uplink_rule
? 1 : 0;
2221 int mlx5_eswitch_set_vport_trust(struct mlx5_eswitch
*esw
,
2222 u16 vport
, bool setting
)
2224 struct mlx5_vport
*evport
= mlx5_eswitch_get_vport(esw
, vport
);
2226 if (!ESW_ALLOWED(esw
))
2229 return PTR_ERR(evport
);
2231 mutex_lock(&esw
->state_lock
);
2232 evport
->info
.trusted
= setting
;
2233 if (evport
->enabled
)
2234 esw_vport_change_handle_locked(evport
);
2235 mutex_unlock(&esw
->state_lock
);
2240 static u32
calculate_vports_min_rate_divider(struct mlx5_eswitch
*esw
)
2242 u32 fw_max_bw_share
= MLX5_CAP_QOS(esw
->dev
, max_tsar_bw_share
);
2243 struct mlx5_vport
*evport
;
2244 u32 max_guarantee
= 0;
2247 mlx5_esw_for_all_vports(esw
, i
, evport
) {
2248 if (!evport
->enabled
|| evport
->info
.min_rate
< max_guarantee
)
2250 max_guarantee
= evport
->info
.min_rate
;
2254 return max_t(u32
, max_guarantee
/ fw_max_bw_share
, 1);
2258 static int normalize_vports_min_rate(struct mlx5_eswitch
*esw
)
2260 u32 fw_max_bw_share
= MLX5_CAP_QOS(esw
->dev
, max_tsar_bw_share
);
2261 u32 divider
= calculate_vports_min_rate_divider(esw
);
2262 struct mlx5_vport
*evport
;
2269 mlx5_esw_for_all_vports(esw
, i
, evport
) {
2270 if (!evport
->enabled
)
2272 vport_min_rate
= evport
->info
.min_rate
;
2273 vport_max_rate
= evport
->info
.max_rate
;
2277 bw_share
= MLX5_RATE_TO_BW_SHARE(vport_min_rate
,
2281 if (bw_share
== evport
->qos
.bw_share
)
2284 err
= esw_vport_qos_config(esw
, evport
, vport_max_rate
,
2287 evport
->qos
.bw_share
= bw_share
;
2295 int mlx5_eswitch_set_vport_rate(struct mlx5_eswitch
*esw
, u16 vport
,
2296 u32 max_rate
, u32 min_rate
)
2298 struct mlx5_vport
*evport
= mlx5_eswitch_get_vport(esw
, vport
);
2299 u32 fw_max_bw_share
;
2300 u32 previous_min_rate
;
2301 bool min_rate_supported
;
2302 bool max_rate_supported
;
2305 if (!ESW_ALLOWED(esw
))
2308 return PTR_ERR(evport
);
2310 fw_max_bw_share
= MLX5_CAP_QOS(esw
->dev
, max_tsar_bw_share
);
2311 min_rate_supported
= MLX5_CAP_QOS(esw
->dev
, esw_bw_share
) &&
2312 fw_max_bw_share
>= MLX5_MIN_BW_SHARE
;
2313 max_rate_supported
= MLX5_CAP_QOS(esw
->dev
, esw_rate_limit
);
2315 if ((min_rate
&& !min_rate_supported
) || (max_rate
&& !max_rate_supported
))
2318 mutex_lock(&esw
->state_lock
);
2320 if (min_rate
== evport
->info
.min_rate
)
2323 previous_min_rate
= evport
->info
.min_rate
;
2324 evport
->info
.min_rate
= min_rate
;
2325 err
= normalize_vports_min_rate(esw
);
2327 evport
->info
.min_rate
= previous_min_rate
;
2332 if (max_rate
== evport
->info
.max_rate
)
2335 err
= esw_vport_qos_config(esw
, evport
, max_rate
, evport
->qos
.bw_share
);
2337 evport
->info
.max_rate
= max_rate
;
2340 mutex_unlock(&esw
->state_lock
);
2344 static int mlx5_eswitch_query_vport_drop_stats(struct mlx5_core_dev
*dev
,
2345 struct mlx5_vport
*vport
,
2346 struct mlx5_vport_drop_stats
*stats
)
2348 struct mlx5_eswitch
*esw
= dev
->priv
.eswitch
;
2349 u64 rx_discard_vport_down
, tx_discard_vport_down
;
2353 if (esw
->mode
!= MLX5_ESWITCH_LEGACY
)
2356 mutex_lock(&esw
->state_lock
);
2357 if (!vport
->enabled
)
2360 if (!IS_ERR_OR_NULL(vport
->egress
.legacy
.drop_counter
))
2361 mlx5_fc_query(dev
, vport
->egress
.legacy
.drop_counter
,
2362 &stats
->rx_dropped
, &bytes
);
2364 if (vport
->ingress
.legacy
.drop_counter
)
2365 mlx5_fc_query(dev
, vport
->ingress
.legacy
.drop_counter
,
2366 &stats
->tx_dropped
, &bytes
);
2368 if (!MLX5_CAP_GEN(dev
, receive_discard_vport_down
) &&
2369 !MLX5_CAP_GEN(dev
, transmit_discard_vport_down
))
2372 err
= mlx5_query_vport_down_stats(dev
, vport
->vport
, 1,
2373 &rx_discard_vport_down
,
2374 &tx_discard_vport_down
);
2378 if (MLX5_CAP_GEN(dev
, receive_discard_vport_down
))
2379 stats
->rx_dropped
+= rx_discard_vport_down
;
2380 if (MLX5_CAP_GEN(dev
, transmit_discard_vport_down
))
2381 stats
->tx_dropped
+= tx_discard_vport_down
;
2384 mutex_unlock(&esw
->state_lock
);
2388 int mlx5_eswitch_get_vport_stats(struct mlx5_eswitch
*esw
,
2390 struct ifla_vf_stats
*vf_stats
)
2392 struct mlx5_vport
*vport
= mlx5_eswitch_get_vport(esw
, vport_num
);
2393 int outlen
= MLX5_ST_SZ_BYTES(query_vport_counter_out
);
2394 u32 in
[MLX5_ST_SZ_DW(query_vport_counter_in
)] = {};
2395 struct mlx5_vport_drop_stats stats
= {};
2400 return PTR_ERR(vport
);
2402 out
= kvzalloc(outlen
, GFP_KERNEL
);
2406 MLX5_SET(query_vport_counter_in
, in
, opcode
,
2407 MLX5_CMD_OP_QUERY_VPORT_COUNTER
);
2408 MLX5_SET(query_vport_counter_in
, in
, op_mod
, 0);
2409 MLX5_SET(query_vport_counter_in
, in
, vport_number
, vport
->vport
);
2410 MLX5_SET(query_vport_counter_in
, in
, other_vport
, 1);
2412 err
= mlx5_cmd_exec_inout(esw
->dev
, query_vport_counter
, in
, out
);
#define MLX5_GET_CTR(p, x) \
	MLX5_GET64(query_vport_counter_out, p, x)
2419 memset(vf_stats
, 0, sizeof(*vf_stats
));
2420 vf_stats
->rx_packets
=
2421 MLX5_GET_CTR(out
, received_eth_unicast
.packets
) +
2422 MLX5_GET_CTR(out
, received_ib_unicast
.packets
) +
2423 MLX5_GET_CTR(out
, received_eth_multicast
.packets
) +
2424 MLX5_GET_CTR(out
, received_ib_multicast
.packets
) +
2425 MLX5_GET_CTR(out
, received_eth_broadcast
.packets
);
2427 vf_stats
->rx_bytes
=
2428 MLX5_GET_CTR(out
, received_eth_unicast
.octets
) +
2429 MLX5_GET_CTR(out
, received_ib_unicast
.octets
) +
2430 MLX5_GET_CTR(out
, received_eth_multicast
.octets
) +
2431 MLX5_GET_CTR(out
, received_ib_multicast
.octets
) +
2432 MLX5_GET_CTR(out
, received_eth_broadcast
.octets
);
2434 vf_stats
->tx_packets
=
2435 MLX5_GET_CTR(out
, transmitted_eth_unicast
.packets
) +
2436 MLX5_GET_CTR(out
, transmitted_ib_unicast
.packets
) +
2437 MLX5_GET_CTR(out
, transmitted_eth_multicast
.packets
) +
2438 MLX5_GET_CTR(out
, transmitted_ib_multicast
.packets
) +
2439 MLX5_GET_CTR(out
, transmitted_eth_broadcast
.packets
);
2441 vf_stats
->tx_bytes
=
2442 MLX5_GET_CTR(out
, transmitted_eth_unicast
.octets
) +
2443 MLX5_GET_CTR(out
, transmitted_ib_unicast
.octets
) +
2444 MLX5_GET_CTR(out
, transmitted_eth_multicast
.octets
) +
2445 MLX5_GET_CTR(out
, transmitted_ib_multicast
.octets
) +
2446 MLX5_GET_CTR(out
, transmitted_eth_broadcast
.octets
);
2448 vf_stats
->multicast
=
2449 MLX5_GET_CTR(out
, received_eth_multicast
.packets
) +
2450 MLX5_GET_CTR(out
, received_ib_multicast
.packets
);
2452 vf_stats
->broadcast
=
2453 MLX5_GET_CTR(out
, received_eth_broadcast
.packets
);
2455 err
= mlx5_eswitch_query_vport_drop_stats(esw
->dev
, vport
, &stats
);
2458 vf_stats
->rx_dropped
= stats
.rx_dropped
;
2459 vf_stats
->tx_dropped
= stats
.tx_dropped
;
2466 u8
mlx5_eswitch_mode(struct mlx5_core_dev
*dev
)
2468 struct mlx5_eswitch
*esw
= dev
->priv
.eswitch
;
2470 return ESW_ALLOWED(esw
) ? esw
->mode
: MLX5_ESWITCH_NONE
;
2472 EXPORT_SYMBOL_GPL(mlx5_eswitch_mode
);
2474 enum devlink_eswitch_encap_mode
2475 mlx5_eswitch_get_encap_mode(const struct mlx5_core_dev
*dev
)
2477 struct mlx5_eswitch
*esw
;
2479 esw
= dev
->priv
.eswitch
;
2480 return ESW_ALLOWED(esw
) ? esw
->offloads
.encap
:
2481 DEVLINK_ESWITCH_ENCAP_MODE_NONE
;
2483 EXPORT_SYMBOL(mlx5_eswitch_get_encap_mode
);
2485 bool mlx5_esw_lag_prereq(struct mlx5_core_dev
*dev0
, struct mlx5_core_dev
*dev1
)
2487 if ((dev0
->priv
.eswitch
->mode
== MLX5_ESWITCH_NONE
&&
2488 dev1
->priv
.eswitch
->mode
== MLX5_ESWITCH_NONE
) ||
2489 (dev0
->priv
.eswitch
->mode
== MLX5_ESWITCH_OFFLOADS
&&
2490 dev1
->priv
.eswitch
->mode
== MLX5_ESWITCH_OFFLOADS
))
2496 bool mlx5_esw_multipath_prereq(struct mlx5_core_dev
*dev0
,
2497 struct mlx5_core_dev
*dev1
)
2499 return (dev0
->priv
.eswitch
->mode
== MLX5_ESWITCH_OFFLOADS
&&
2500 dev1
->priv
.eswitch
->mode
== MLX5_ESWITCH_OFFLOADS
);