// SPDX-License-Identifier: GPL-2.0-or-later
/*
 * net/switchdev/switchdev.c - Switch device API
 * Copyright (c) 2014-2015 Jiri Pirko <jiri@resnulli.us>
 * Copyright (c) 2014-2015 Scott Feldman <sfeldma@gmail.com>
 */

#include <linux/kernel.h>
#include <linux/types.h>
#include <linux/init.h>
#include <linux/mutex.h>
#include <linux/notifier.h>
#include <linux/netdevice.h>
#include <linux/etherdevice.h>
#include <linux/if_bridge.h>
#include <linux/list.h>
#include <linux/workqueue.h>
#include <linux/if_vlan.h>
#include <linux/rtnetlink.h>
#include <net/switchdev.h>

static LIST_HEAD(deferred);
static DEFINE_SPINLOCK(deferred_lock);

typedef void switchdev_deferred_func_t(struct net_device *dev,
				       const void *data);

struct switchdev_deferred_item {
	struct list_head list;
	struct net_device *dev;
	switchdev_deferred_func_t *func;
	unsigned long data[];
};

static struct switchdev_deferred_item *switchdev_deferred_dequeue(void)
{
	struct switchdev_deferred_item *dfitem;

	spin_lock_bh(&deferred_lock);
	if (list_empty(&deferred)) {
		dfitem = NULL;
		goto unlock;
	}
	dfitem = list_first_entry(&deferred,
				  struct switchdev_deferred_item, list);
	list_del(&dfitem->list);
unlock:
	spin_unlock_bh(&deferred_lock);
	return dfitem;
}

/**
 * switchdev_deferred_process - Process ops in deferred queue
 *
 * Called to flush the ops currently queued in deferred ops queue.
 * rtnl_lock must be held.
 */
void switchdev_deferred_process(void)
{
	struct switchdev_deferred_item *dfitem;

	ASSERT_RTNL();

	while ((dfitem = switchdev_deferred_dequeue())) {
		dfitem->func(dfitem->dev, dfitem->data);
		/* Drop the reference taken at enqueue time and free the item. */
		dev_put(dfitem->dev);
		kfree(dfitem);
	}
}
EXPORT_SYMBOL_GPL(switchdev_deferred_process);

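/* A minimal usage sketch, not part of this file: any caller already
 * holding rtnl can flush pending deferred ops before proceeding (the
 * bridge, for example, does this when a port is being removed).  The
 * surrounding locking is the caller's responsibility:
 *
 *	rtnl_lock();
 *	switchdev_deferred_process();
 *	rtnl_unlock();
 */
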
static void switchdev_deferred_process_work(struct work_struct *work)
{
	rtnl_lock();
	switchdev_deferred_process();
	rtnl_unlock();
}

static DECLARE_WORK(deferred_process_work, switchdev_deferred_process_work);

static int switchdev_deferred_enqueue(struct net_device *dev,
				      const void *data, size_t data_len,
				      switchdev_deferred_func_t *func)
{
	struct switchdev_deferred_item *dfitem;

	dfitem = kmalloc(sizeof(*dfitem) + data_len, GFP_ATOMIC);
	if (!dfitem)
		return -ENOMEM;
	dfitem->dev = dev;
	dfitem->func = func;
	memcpy(dfitem->data, data, data_len);
	/* Hold the device until the deferred op has been processed. */
	dev_hold(dev);
	spin_lock_bh(&deferred_lock);
	list_add_tail(&dfitem->list, &deferred);
	spin_unlock_bh(&deferred_lock);
	schedule_work(&deferred_process_work);
	return 0;
}

static int switchdev_port_attr_notify(enum switchdev_notifier_type nt,
				      struct net_device *dev,
				      const struct switchdev_attr *attr,
				      struct switchdev_trans *trans)
{
	int err;
	int rc;

	struct switchdev_notifier_port_attr_info attr_info = {
		.attr = attr,
		.trans = trans,
		.handled = false,
	};

	rc = call_switchdev_blocking_notifiers(nt, dev,
					       &attr_info.info, NULL);
	err = notifier_to_errno(rc);
	if (err) {
		WARN_ON(!attr_info.handled);
		return err;
	}

	if (!attr_info.handled)
		return -EOPNOTSUPP;

	return 0;
}

static int switchdev_port_attr_set_now(struct net_device *dev,
				       const struct switchdev_attr *attr)
{
	struct switchdev_trans trans;
	int err;

	/* Phase I: prepare for attr set. Driver/device should fail
	 * here if there are going to be issues in the commit phase,
	 * such as lack of resources or support. The driver/device
	 * should reserve resources needed for the commit phase here,
	 * but should not commit the attr.
	 */

	trans.ph_prepare = true;
	err = switchdev_port_attr_notify(SWITCHDEV_PORT_ATTR_SET, dev, attr,
					 &trans);
	if (err)
		return err;

	/* Phase II: commit attr set. This cannot fail as a fault
	 * of driver/device. If it does, it's a bug in the driver/device
	 * because the driver said everything was OK in phase I.
	 */

	trans.ph_prepare = false;
	err = switchdev_port_attr_notify(SWITCHDEV_PORT_ATTR_SET, dev, attr,
					 &trans);
	WARN(err, "%s: Commit of attribute (id=%d) failed.\n",
	     dev->name, attr->id);

	return err;
}

static void switchdev_port_attr_set_deferred(struct net_device *dev,
					     const void *data)
{
	const struct switchdev_attr *attr = data;
	int err;

	err = switchdev_port_attr_set_now(dev, attr);
	if (err && err != -EOPNOTSUPP)
		netdev_err(dev, "failed (err=%d) to set attribute (id=%d)\n",
			   err, attr->id);
	if (attr->complete)
		attr->complete(dev, err, attr->complete_priv);
}

static int switchdev_port_attr_set_defer(struct net_device *dev,
					 const struct switchdev_attr *attr)
{
	return switchdev_deferred_enqueue(dev, attr, sizeof(*attr),
					  switchdev_port_attr_set_deferred);
}

/**
 * switchdev_port_attr_set - Set port attribute
 *
 * @dev: port device
 * @attr: attribute to set
 *
 * Use a 2-phase prepare-commit transaction model to ensure
 * system is not left in a partially updated state due to
 * failure from driver/device.
 *
 * rtnl_lock must be held and must not be in atomic section,
 * in case SWITCHDEV_F_DEFER flag is not set.
 */
int switchdev_port_attr_set(struct net_device *dev,
			    const struct switchdev_attr *attr)
{
	if (attr->flags & SWITCHDEV_F_DEFER)
		return switchdev_port_attr_set_defer(dev, attr);
	ASSERT_RTNL();
	return switchdev_port_attr_set_now(dev, attr);
}
EXPORT_SYMBOL_GPL(switchdev_port_attr_set);

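/* A hedged usage sketch, not part of this file: a caller deferring an
 * STP state change on an offloaded bridge port.  "port_dev" is a
 * hypothetical switch port netdev; the attribute layout follows
 * struct switchdev_attr as of this kernel version.
 *
 *	struct switchdev_attr attr = {
 *		.orig_dev = port_dev,
 *		.id = SWITCHDEV_ATTR_ID_PORT_STP_STATE,
 *		.flags = SWITCHDEV_F_DEFER,
 *		.u.stp_state = BR_STATE_FORWARDING,
 *	};
 *	int err = switchdev_port_attr_set(port_dev, &attr);
 *
 * With SWITCHDEV_F_DEFER set, a zero return only means the op was
 * queued; the final result is reported via attr.complete, if provided.
 */
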
static size_t switchdev_obj_size(const struct switchdev_obj *obj)
{
	switch (obj->id) {
	case SWITCHDEV_OBJ_ID_PORT_VLAN:
		return sizeof(struct switchdev_obj_port_vlan);
	case SWITCHDEV_OBJ_ID_PORT_MDB:
		return sizeof(struct switchdev_obj_port_mdb);
	case SWITCHDEV_OBJ_ID_HOST_MDB:
		return sizeof(struct switchdev_obj_port_mdb);
	default:
		BUG();
	}
	return 0;
}

static int switchdev_port_obj_notify(enum switchdev_notifier_type nt,
				     struct net_device *dev,
				     const struct switchdev_obj *obj,
				     struct switchdev_trans *trans,
				     struct netlink_ext_ack *extack)
{
	int rc;
	int err;

	struct switchdev_notifier_port_obj_info obj_info = {
		.obj = obj,
		.trans = trans,
		.handled = false,
	};

	rc = call_switchdev_blocking_notifiers(nt, dev, &obj_info.info, extack);
	err = notifier_to_errno(rc);
	if (err) {
		WARN_ON(!obj_info.handled);
		return err;
	}
	if (!obj_info.handled)
		return -EOPNOTSUPP;
	return 0;
}

static int switchdev_port_obj_add_now(struct net_device *dev,
				      const struct switchdev_obj *obj,
				      struct netlink_ext_ack *extack)
{
	struct switchdev_trans trans;
	int err;

	ASSERT_RTNL();

	/* Phase I: prepare for obj add. Driver/device should fail
	 * here if there are going to be issues in the commit phase,
	 * such as lack of resources or support. The driver/device
	 * should reserve resources needed for the commit phase here,
	 * but should not commit the obj.
	 */

	trans.ph_prepare = true;
	err = switchdev_port_obj_notify(SWITCHDEV_PORT_OBJ_ADD,
					dev, obj, &trans, extack);
	if (err)
		return err;

	/* Phase II: commit obj add. This cannot fail as a fault
	 * of driver/device. If it does, it's a bug in the driver/device
	 * because the driver said everything was OK in phase I.
	 */

	trans.ph_prepare = false;
	err = switchdev_port_obj_notify(SWITCHDEV_PORT_OBJ_ADD,
					dev, obj, &trans, extack);
	WARN(err, "%s: Commit of object (id=%d) failed.\n", dev->name, obj->id);

	return err;
}

static void switchdev_port_obj_add_deferred(struct net_device *dev,
					    const void *data)
{
	const struct switchdev_obj *obj = data;
	int err;

	err = switchdev_port_obj_add_now(dev, obj, NULL);
	if (err && err != -EOPNOTSUPP)
		netdev_err(dev, "failed (err=%d) to add object (id=%d)\n",
			   err, obj->id);
	if (obj->complete)
		obj->complete(dev, err, obj->complete_priv);
}

static int switchdev_port_obj_add_defer(struct net_device *dev,
					const struct switchdev_obj *obj)
{
	return switchdev_deferred_enqueue(dev, obj, switchdev_obj_size(obj),
					  switchdev_port_obj_add_deferred);
}

/**
 * switchdev_port_obj_add - Add port object
 *
 * @dev: port device
 * @obj: object to add
 * @extack: netlink extended ack
 *
 * Use a 2-phase prepare-commit transaction model to ensure
 * system is not left in a partially updated state due to
 * failure from driver/device.
 *
 * rtnl_lock must be held and must not be in atomic section,
 * in case SWITCHDEV_F_DEFER flag is not set.
 */
int switchdev_port_obj_add(struct net_device *dev,
			   const struct switchdev_obj *obj,
			   struct netlink_ext_ack *extack)
{
	if (obj->flags & SWITCHDEV_F_DEFER)
		return switchdev_port_obj_add_defer(dev, obj);
	ASSERT_RTNL();
	return switchdev_port_obj_add_now(dev, obj, extack);
}
EXPORT_SYMBOL_GPL(switchdev_port_obj_add);

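/* A hedged usage sketch, not part of this file: adding VLAN 10 as
 * PVID/untagged on a port.  "port_dev" and "extack" are hypothetical;
 * the vid_begin/vid_end range layout matches
 * struct switchdev_obj_port_vlan as of this kernel version.
 *
 *	struct switchdev_obj_port_vlan vlan = {
 *		.obj.orig_dev = port_dev,
 *		.obj.id = SWITCHDEV_OBJ_ID_PORT_VLAN,
 *		.flags = BRIDGE_VLAN_INFO_PVID | BRIDGE_VLAN_INFO_UNTAGGED,
 *		.vid_begin = 10,
 *		.vid_end = 10,
 *	};
 *	int err = switchdev_port_obj_add(port_dev, &vlan.obj, extack);
 *
 * Deletion is symmetric: switchdev_port_obj_del(port_dev, &vlan.obj).
 */
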
static int switchdev_port_obj_del_now(struct net_device *dev,
				      const struct switchdev_obj *obj)
{
	return switchdev_port_obj_notify(SWITCHDEV_PORT_OBJ_DEL,
					 dev, obj, NULL, NULL);
}

static void switchdev_port_obj_del_deferred(struct net_device *dev,
					    const void *data)
{
	const struct switchdev_obj *obj = data;
	int err;

	err = switchdev_port_obj_del_now(dev, obj);
	if (err && err != -EOPNOTSUPP)
		netdev_err(dev, "failed (err=%d) to del object (id=%d)\n",
			   err, obj->id);
	if (obj->complete)
		obj->complete(dev, err, obj->complete_priv);
}

static int switchdev_port_obj_del_defer(struct net_device *dev,
					const struct switchdev_obj *obj)
{
	return switchdev_deferred_enqueue(dev, obj, switchdev_obj_size(obj),
					  switchdev_port_obj_del_deferred);
}

/**
 * switchdev_port_obj_del - Delete port object
 *
 * @dev: port device
 * @obj: object to delete
 *
 * rtnl_lock must be held and must not be in atomic section,
 * in case SWITCHDEV_F_DEFER flag is not set.
 */
int switchdev_port_obj_del(struct net_device *dev,
			   const struct switchdev_obj *obj)
{
	if (obj->flags & SWITCHDEV_F_DEFER)
		return switchdev_port_obj_del_defer(dev, obj);
	ASSERT_RTNL();
	return switchdev_port_obj_del_now(dev, obj);
}
EXPORT_SYMBOL_GPL(switchdev_port_obj_del);

static ATOMIC_NOTIFIER_HEAD(switchdev_notif_chain);
static BLOCKING_NOTIFIER_HEAD(switchdev_blocking_notif_chain);

/**
 * register_switchdev_notifier - Register notifier
 * @nb: notifier_block
 *
 * Register switch device notifier.
 */
int register_switchdev_notifier(struct notifier_block *nb)
{
	return atomic_notifier_chain_register(&switchdev_notif_chain, nb);
}
EXPORT_SYMBOL_GPL(register_switchdev_notifier);

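/* A hedged driver-side sketch, not part of this file: atomic-chain
 * events such as SWITCHDEV_FDB_ADD_TO_DEVICE arrive through a
 * notifier_block registered here.  All "example_*" names are assumed.
 *
 *	static int example_switchdev_event(struct notifier_block *nb,
 *					   unsigned long event, void *ptr)
 *	{
 *		struct net_device *dev = switchdev_notifier_info_to_dev(ptr);
 *
 *		switch (event) {
 *		case SWITCHDEV_FDB_ADD_TO_DEVICE:
 *			// atomic context: schedule FDB programming,
 *			// don't sleep here
 *			return NOTIFY_DONE;
 *		}
 *		return NOTIFY_DONE;
 *	}
 *
 *	static struct notifier_block example_switchdev_nb = {
 *		.notifier_call = example_switchdev_event,
 *	};
 *
 *	err = register_switchdev_notifier(&example_switchdev_nb);
 */
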
/**
 * unregister_switchdev_notifier - Unregister notifier
 * @nb: notifier_block
 *
 * Unregister switch device notifier.
 */
int unregister_switchdev_notifier(struct notifier_block *nb)
{
	return atomic_notifier_chain_unregister(&switchdev_notif_chain, nb);
}
EXPORT_SYMBOL_GPL(unregister_switchdev_notifier);

/**
 * call_switchdev_notifiers - Call notifiers
 * @val: value passed unmodified to notifier function
 * @dev: port device
 * @info: notifier information data
 * @extack: netlink extended ack
 *
 * Call all network notifier blocks.
 */
int call_switchdev_notifiers(unsigned long val, struct net_device *dev,
			     struct switchdev_notifier_info *info,
			     struct netlink_ext_ack *extack)
{
	info->dev = dev;
	info->extack = extack;
	return atomic_notifier_call_chain(&switchdev_notif_chain, val, info);
}
EXPORT_SYMBOL_GPL(call_switchdev_notifiers);

int register_switchdev_blocking_notifier(struct notifier_block *nb)
{
	struct blocking_notifier_head *chain = &switchdev_blocking_notif_chain;

	return blocking_notifier_chain_register(chain, nb);
}
EXPORT_SYMBOL_GPL(register_switchdev_blocking_notifier);

int unregister_switchdev_blocking_notifier(struct notifier_block *nb)
{
	struct blocking_notifier_head *chain = &switchdev_blocking_notif_chain;

	return blocking_notifier_chain_unregister(chain, nb);
}
EXPORT_SYMBOL_GPL(unregister_switchdev_blocking_notifier);

int call_switchdev_blocking_notifiers(unsigned long val, struct net_device *dev,
				      struct switchdev_notifier_info *info,
				      struct netlink_ext_ack *extack)
{
	info->dev = dev;
	info->extack = extack;
	return blocking_notifier_call_chain(&switchdev_blocking_notif_chain,
					    val, info);
}
EXPORT_SYMBOL_GPL(call_switchdev_blocking_notifiers);

static int __switchdev_handle_port_obj_add(struct net_device *dev,
			struct switchdev_notifier_port_obj_info *port_obj_info,
			bool (*check_cb)(const struct net_device *dev),
			int (*add_cb)(struct net_device *dev,
				      const struct switchdev_obj *obj,
				      struct switchdev_trans *trans,
				      struct netlink_ext_ack *extack))
{
	struct netlink_ext_ack *extack;
	struct net_device *lower_dev;
	struct list_head *iter;
	int err = -EOPNOTSUPP;

	extack = switchdev_notifier_info_to_extack(&port_obj_info->info);

	if (check_cb(dev)) {
		/* This flag is only checked if the return value is success. */
		port_obj_info->handled = true;
		return add_cb(dev, port_obj_info->obj, port_obj_info->trans,
			      extack);
	}

	/* Switch ports might be stacked under e.g. a LAG. Ignore the
	 * unsupported devices; another driver might be able to handle them. But
	 * propagate to the callers any hard errors.
	 *
	 * If the driver does its own bookkeeping of stacked ports, it's not
	 * necessary to go through this helper.
	 */
	netdev_for_each_lower_dev(dev, lower_dev, iter) {
		if (netif_is_bridge_master(lower_dev))
			continue;

		err = __switchdev_handle_port_obj_add(lower_dev, port_obj_info,
						      check_cb, add_cb);
		if (err && err != -EOPNOTSUPP)
			return err;
	}

	return err;
}

int switchdev_handle_port_obj_add(struct net_device *dev,
			struct switchdev_notifier_port_obj_info *port_obj_info,
			bool (*check_cb)(const struct net_device *dev),
			int (*add_cb)(struct net_device *dev,
				      const struct switchdev_obj *obj,
				      struct switchdev_trans *trans,
				      struct netlink_ext_ack *extack))
{
	int err;

	err = __switchdev_handle_port_obj_add(dev, port_obj_info, check_cb,
					      add_cb);
	if (err == -EOPNOTSUPP)
		err = 0;
	return err;
}
EXPORT_SYMBOL_GPL(switchdev_handle_port_obj_add);

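/* A hedged sketch of how a driver's blocking notifier might dispatch to
 * this helper, not part of this file.  All "example_*" names are
 * assumed: check_cb answers "is this netdev one of mine?", add_cb
 * programs the object into the hardware.
 *
 *	static int example_blocking_event(struct notifier_block *nb,
 *					  unsigned long event, void *ptr)
 *	{
 *		struct net_device *dev = switchdev_notifier_info_to_dev(ptr);
 *		int err;
 *
 *		switch (event) {
 *		case SWITCHDEV_PORT_OBJ_ADD:
 *			err = switchdev_handle_port_obj_add(dev, ptr,
 *						example_port_dev_check,
 *						example_port_obj_add);
 *			return notifier_from_errno(err);
 *		}
 *		return NOTIFY_DONE;
 *	}
 *
 * The _del and _attr_set helpers below follow the same pattern.
 */
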
static int __switchdev_handle_port_obj_del(struct net_device *dev,
			struct switchdev_notifier_port_obj_info *port_obj_info,
			bool (*check_cb)(const struct net_device *dev),
			int (*del_cb)(struct net_device *dev,
				      const struct switchdev_obj *obj))
{
	struct net_device *lower_dev;
	struct list_head *iter;
	int err = -EOPNOTSUPP;

	if (check_cb(dev)) {
		/* This flag is only checked if the return value is success. */
		port_obj_info->handled = true;
		return del_cb(dev, port_obj_info->obj);
	}

	/* Switch ports might be stacked under e.g. a LAG. Ignore the
	 * unsupported devices; another driver might be able to handle them. But
	 * propagate to the callers any hard errors.
	 *
	 * If the driver does its own bookkeeping of stacked ports, it's not
	 * necessary to go through this helper.
	 */
	netdev_for_each_lower_dev(dev, lower_dev, iter) {
		if (netif_is_bridge_master(lower_dev))
			continue;

		err = __switchdev_handle_port_obj_del(lower_dev, port_obj_info,
						      check_cb, del_cb);
		if (err && err != -EOPNOTSUPP)
			return err;
	}

	return err;
}

int switchdev_handle_port_obj_del(struct net_device *dev,
			struct switchdev_notifier_port_obj_info *port_obj_info,
			bool (*check_cb)(const struct net_device *dev),
			int (*del_cb)(struct net_device *dev,
				      const struct switchdev_obj *obj))
{
	int err;

	err = __switchdev_handle_port_obj_del(dev, port_obj_info, check_cb,
					      del_cb);
	if (err == -EOPNOTSUPP)
		err = 0;
	return err;
}
EXPORT_SYMBOL_GPL(switchdev_handle_port_obj_del);

static int __switchdev_handle_port_attr_set(struct net_device *dev,
			struct switchdev_notifier_port_attr_info *port_attr_info,
			bool (*check_cb)(const struct net_device *dev),
			int (*set_cb)(struct net_device *dev,
				      const struct switchdev_attr *attr,
				      struct switchdev_trans *trans))
{
	struct net_device *lower_dev;
	struct list_head *iter;
	int err = -EOPNOTSUPP;

	if (check_cb(dev)) {
		port_attr_info->handled = true;
		return set_cb(dev, port_attr_info->attr,
			      port_attr_info->trans);
	}

	/* Switch ports might be stacked under e.g. a LAG. Ignore the
	 * unsupported devices; another driver might be able to handle them. But
	 * propagate to the callers any hard errors.
	 *
	 * If the driver does its own bookkeeping of stacked ports, it's not
	 * necessary to go through this helper.
	 */
	netdev_for_each_lower_dev(dev, lower_dev, iter) {
		if (netif_is_bridge_master(lower_dev))
			continue;

		err = __switchdev_handle_port_attr_set(lower_dev, port_attr_info,
						       check_cb, set_cb);
		if (err && err != -EOPNOTSUPP)
			return err;
	}

	return err;
}

int switchdev_handle_port_attr_set(struct net_device *dev,
			struct switchdev_notifier_port_attr_info *port_attr_info,
			bool (*check_cb)(const struct net_device *dev),
			int (*set_cb)(struct net_device *dev,
				      const struct switchdev_attr *attr,
				      struct switchdev_trans *trans))
{
	int err;

	err = __switchdev_handle_port_attr_set(dev, port_attr_info, check_cb,
					       set_cb);
	if (err == -EOPNOTSUPP)
		err = 0;
	return err;
}
EXPORT_SYMBOL_GPL(switchdev_handle_port_attr_set);