xref: /linux-6.15/net/switchdev/switchdev.c (revision 47d5b6db)
1007f790cSJiri Pirko /*
2007f790cSJiri Pirko  * net/switchdev/switchdev.c - Switch device API
37ea6eb3fSJiri Pirko  * Copyright (c) 2014-2015 Jiri Pirko <[email protected]>
4f8f21471SScott Feldman  * Copyright (c) 2014-2015 Scott Feldman <[email protected]>
5007f790cSJiri Pirko  *
6007f790cSJiri Pirko  * This program is free software; you can redistribute it and/or modify
7007f790cSJiri Pirko  * it under the terms of the GNU General Public License as published by
8007f790cSJiri Pirko  * the Free Software Foundation; either version 2 of the License, or
9007f790cSJiri Pirko  * (at your option) any later version.
10007f790cSJiri Pirko  */
11007f790cSJiri Pirko 
12007f790cSJiri Pirko #include <linux/kernel.h>
13007f790cSJiri Pirko #include <linux/types.h>
14007f790cSJiri Pirko #include <linux/init.h>
1503bf0c28SJiri Pirko #include <linux/mutex.h>
1603bf0c28SJiri Pirko #include <linux/notifier.h>
17007f790cSJiri Pirko #include <linux/netdevice.h>
18850d0cbcSJiri Pirko #include <linux/etherdevice.h>
1947f8328bSScott Feldman #include <linux/if_bridge.h>
207ea6eb3fSJiri Pirko #include <linux/list.h>
21793f4014SJiri Pirko #include <linux/workqueue.h>
2287aaf2caSNikolay Aleksandrov #include <linux/if_vlan.h>
234f2c6ae5SIdo Schimmel #include <linux/rtnetlink.h>
24007f790cSJiri Pirko #include <net/switchdev.h>
25007f790cSJiri Pirko 
26007f790cSJiri Pirko /**
277ea6eb3fSJiri Pirko  *	switchdev_trans_item_enqueue - Enqueue data item to transaction queue
287ea6eb3fSJiri Pirko  *
297ea6eb3fSJiri Pirko  *	@trans: transaction
307ea6eb3fSJiri Pirko  *	@data: pointer to data being queued
317ea6eb3fSJiri Pirko  *	@destructor: data destructor
327ea6eb3fSJiri Pirko  *	@tritem: transaction item being queued
337ea6eb3fSJiri Pirko  *
347ea6eb3fSJiri Pirko  *	Enqeueue data item to transaction queue. tritem is typically placed in
357ea6eb3fSJiri Pirko  *	cointainter pointed at by data pointer. Destructor is called on
367ea6eb3fSJiri Pirko  *	transaction abort and after successful commit phase in case
377ea6eb3fSJiri Pirko  *	the caller did not dequeue the item before.
387ea6eb3fSJiri Pirko  */
397ea6eb3fSJiri Pirko void switchdev_trans_item_enqueue(struct switchdev_trans *trans,
407ea6eb3fSJiri Pirko 				  void *data, void (*destructor)(void const *),
417ea6eb3fSJiri Pirko 				  struct switchdev_trans_item *tritem)
427ea6eb3fSJiri Pirko {
437ea6eb3fSJiri Pirko 	tritem->data = data;
447ea6eb3fSJiri Pirko 	tritem->destructor = destructor;
457ea6eb3fSJiri Pirko 	list_add_tail(&tritem->list, &trans->item_list);
467ea6eb3fSJiri Pirko }
477ea6eb3fSJiri Pirko EXPORT_SYMBOL_GPL(switchdev_trans_item_enqueue);
487ea6eb3fSJiri Pirko 
497ea6eb3fSJiri Pirko static struct switchdev_trans_item *
507ea6eb3fSJiri Pirko __switchdev_trans_item_dequeue(struct switchdev_trans *trans)
517ea6eb3fSJiri Pirko {
527ea6eb3fSJiri Pirko 	struct switchdev_trans_item *tritem;
537ea6eb3fSJiri Pirko 
547ea6eb3fSJiri Pirko 	if (list_empty(&trans->item_list))
557ea6eb3fSJiri Pirko 		return NULL;
567ea6eb3fSJiri Pirko 	tritem = list_first_entry(&trans->item_list,
577ea6eb3fSJiri Pirko 				  struct switchdev_trans_item, list);
587ea6eb3fSJiri Pirko 	list_del(&tritem->list);
597ea6eb3fSJiri Pirko 	return tritem;
607ea6eb3fSJiri Pirko }
617ea6eb3fSJiri Pirko 
627ea6eb3fSJiri Pirko /**
637ea6eb3fSJiri Pirko  *	switchdev_trans_item_dequeue - Dequeue data item from transaction queue
647ea6eb3fSJiri Pirko  *
657ea6eb3fSJiri Pirko  *	@trans: transaction
667ea6eb3fSJiri Pirko  */
677ea6eb3fSJiri Pirko void *switchdev_trans_item_dequeue(struct switchdev_trans *trans)
687ea6eb3fSJiri Pirko {
697ea6eb3fSJiri Pirko 	struct switchdev_trans_item *tritem;
707ea6eb3fSJiri Pirko 
717ea6eb3fSJiri Pirko 	tritem = __switchdev_trans_item_dequeue(trans);
727ea6eb3fSJiri Pirko 	BUG_ON(!tritem);
737ea6eb3fSJiri Pirko 	return tritem->data;
747ea6eb3fSJiri Pirko }
757ea6eb3fSJiri Pirko EXPORT_SYMBOL_GPL(switchdev_trans_item_dequeue);
767ea6eb3fSJiri Pirko 
777ea6eb3fSJiri Pirko static void switchdev_trans_init(struct switchdev_trans *trans)
787ea6eb3fSJiri Pirko {
797ea6eb3fSJiri Pirko 	INIT_LIST_HEAD(&trans->item_list);
807ea6eb3fSJiri Pirko }
817ea6eb3fSJiri Pirko 
827ea6eb3fSJiri Pirko static void switchdev_trans_items_destroy(struct switchdev_trans *trans)
837ea6eb3fSJiri Pirko {
847ea6eb3fSJiri Pirko 	struct switchdev_trans_item *tritem;
857ea6eb3fSJiri Pirko 
867ea6eb3fSJiri Pirko 	while ((tritem = __switchdev_trans_item_dequeue(trans)))
877ea6eb3fSJiri Pirko 		tritem->destructor(tritem->data);
887ea6eb3fSJiri Pirko }
897ea6eb3fSJiri Pirko 
907ea6eb3fSJiri Pirko static void switchdev_trans_items_warn_destroy(struct net_device *dev,
917ea6eb3fSJiri Pirko 					       struct switchdev_trans *trans)
927ea6eb3fSJiri Pirko {
937ea6eb3fSJiri Pirko 	WARN(!list_empty(&trans->item_list), "%s: transaction item queue is not empty.\n",
947ea6eb3fSJiri Pirko 	     dev->name);
957ea6eb3fSJiri Pirko 	switchdev_trans_items_destroy(trans);
967ea6eb3fSJiri Pirko }
977ea6eb3fSJiri Pirko 
98793f4014SJiri Pirko static LIST_HEAD(deferred);
99793f4014SJiri Pirko static DEFINE_SPINLOCK(deferred_lock);
100793f4014SJiri Pirko 
101793f4014SJiri Pirko typedef void switchdev_deferred_func_t(struct net_device *dev,
102793f4014SJiri Pirko 				       const void *data);
103793f4014SJiri Pirko 
104793f4014SJiri Pirko struct switchdev_deferred_item {
105793f4014SJiri Pirko 	struct list_head list;
106793f4014SJiri Pirko 	struct net_device *dev;
107793f4014SJiri Pirko 	switchdev_deferred_func_t *func;
108793f4014SJiri Pirko 	unsigned long data[0];
109793f4014SJiri Pirko };
110793f4014SJiri Pirko 
111793f4014SJiri Pirko static struct switchdev_deferred_item *switchdev_deferred_dequeue(void)
112793f4014SJiri Pirko {
113793f4014SJiri Pirko 	struct switchdev_deferred_item *dfitem;
114793f4014SJiri Pirko 
115793f4014SJiri Pirko 	spin_lock_bh(&deferred_lock);
116793f4014SJiri Pirko 	if (list_empty(&deferred)) {
117793f4014SJiri Pirko 		dfitem = NULL;
118793f4014SJiri Pirko 		goto unlock;
119793f4014SJiri Pirko 	}
120793f4014SJiri Pirko 	dfitem = list_first_entry(&deferred,
121793f4014SJiri Pirko 				  struct switchdev_deferred_item, list);
122793f4014SJiri Pirko 	list_del(&dfitem->list);
123793f4014SJiri Pirko unlock:
124793f4014SJiri Pirko 	spin_unlock_bh(&deferred_lock);
125793f4014SJiri Pirko 	return dfitem;
126793f4014SJiri Pirko }
127793f4014SJiri Pirko 
128793f4014SJiri Pirko /**
129793f4014SJiri Pirko  *	switchdev_deferred_process - Process ops in deferred queue
130793f4014SJiri Pirko  *
131793f4014SJiri Pirko  *	Called to flush the ops currently queued in deferred ops queue.
132793f4014SJiri Pirko  *	rtnl_lock must be held.
133793f4014SJiri Pirko  */
134793f4014SJiri Pirko void switchdev_deferred_process(void)
135793f4014SJiri Pirko {
136793f4014SJiri Pirko 	struct switchdev_deferred_item *dfitem;
137793f4014SJiri Pirko 
138793f4014SJiri Pirko 	ASSERT_RTNL();
139793f4014SJiri Pirko 
140793f4014SJiri Pirko 	while ((dfitem = switchdev_deferred_dequeue())) {
141793f4014SJiri Pirko 		dfitem->func(dfitem->dev, dfitem->data);
142793f4014SJiri Pirko 		dev_put(dfitem->dev);
143793f4014SJiri Pirko 		kfree(dfitem);
144793f4014SJiri Pirko 	}
145793f4014SJiri Pirko }
146793f4014SJiri Pirko EXPORT_SYMBOL_GPL(switchdev_deferred_process);
147793f4014SJiri Pirko 
/* Work handler: flush the deferred queue while holding rtnl_lock, which
 * switchdev_deferred_process() asserts.
 */
static void switchdev_deferred_process_work(struct work_struct *work)
{
	rtnl_lock();
	switchdev_deferred_process();
	rtnl_unlock();
}

/* Work item that runs the handler above. */
static DECLARE_WORK(deferred_process_work, switchdev_deferred_process_work);
156793f4014SJiri Pirko 
157793f4014SJiri Pirko static int switchdev_deferred_enqueue(struct net_device *dev,
158793f4014SJiri Pirko 				      const void *data, size_t data_len,
159793f4014SJiri Pirko 				      switchdev_deferred_func_t *func)
160793f4014SJiri Pirko {
161793f4014SJiri Pirko 	struct switchdev_deferred_item *dfitem;
162793f4014SJiri Pirko 
163793f4014SJiri Pirko 	dfitem = kmalloc(sizeof(*dfitem) + data_len, GFP_ATOMIC);
164793f4014SJiri Pirko 	if (!dfitem)
165793f4014SJiri Pirko 		return -ENOMEM;
166793f4014SJiri Pirko 	dfitem->dev = dev;
167793f4014SJiri Pirko 	dfitem->func = func;
168793f4014SJiri Pirko 	memcpy(dfitem->data, data, data_len);
169793f4014SJiri Pirko 	dev_hold(dev);
170793f4014SJiri Pirko 	spin_lock_bh(&deferred_lock);
171793f4014SJiri Pirko 	list_add_tail(&dfitem->list, &deferred);
172793f4014SJiri Pirko 	spin_unlock_bh(&deferred_lock);
173793f4014SJiri Pirko 	schedule_work(&deferred_process_work);
174793f4014SJiri Pirko 	return 0;
175793f4014SJiri Pirko }
176793f4014SJiri Pirko 
1777ea6eb3fSJiri Pirko /**
1783094333dSScott Feldman  *	switchdev_port_attr_get - Get port attribute
1793094333dSScott Feldman  *
1803094333dSScott Feldman  *	@dev: port device
1813094333dSScott Feldman  *	@attr: attribute to get
1823094333dSScott Feldman  */
1833094333dSScott Feldman int switchdev_port_attr_get(struct net_device *dev, struct switchdev_attr *attr)
1843094333dSScott Feldman {
1853094333dSScott Feldman 	const struct switchdev_ops *ops = dev->switchdev_ops;
1863094333dSScott Feldman 	struct net_device *lower_dev;
1873094333dSScott Feldman 	struct list_head *iter;
1883094333dSScott Feldman 	struct switchdev_attr first = {
1891f868398SJiri Pirko 		.id = SWITCHDEV_ATTR_ID_UNDEFINED
1903094333dSScott Feldman 	};
1913094333dSScott Feldman 	int err = -EOPNOTSUPP;
1923094333dSScott Feldman 
1933094333dSScott Feldman 	if (ops && ops->switchdev_port_attr_get)
1943094333dSScott Feldman 		return ops->switchdev_port_attr_get(dev, attr);
1953094333dSScott Feldman 
1963094333dSScott Feldman 	if (attr->flags & SWITCHDEV_F_NO_RECURSE)
1973094333dSScott Feldman 		return err;
1983094333dSScott Feldman 
1993094333dSScott Feldman 	/* Switch device port(s) may be stacked under
2003094333dSScott Feldman 	 * bond/team/vlan dev, so recurse down to get attr on
2013094333dSScott Feldman 	 * each port.  Return -ENODATA if attr values don't
2023094333dSScott Feldman 	 * compare across ports.
2033094333dSScott Feldman 	 */
2043094333dSScott Feldman 
2053094333dSScott Feldman 	netdev_for_each_lower_dev(dev, lower_dev, iter) {
2063094333dSScott Feldman 		err = switchdev_port_attr_get(lower_dev, attr);
2073094333dSScott Feldman 		if (err)
2083094333dSScott Feldman 			break;
2091f868398SJiri Pirko 		if (first.id == SWITCHDEV_ATTR_ID_UNDEFINED)
2103094333dSScott Feldman 			first = *attr;
2113094333dSScott Feldman 		else if (memcmp(&first, attr, sizeof(*attr)))
2123094333dSScott Feldman 			return -ENODATA;
2133094333dSScott Feldman 	}
2143094333dSScott Feldman 
2153094333dSScott Feldman 	return err;
2163094333dSScott Feldman }
2173094333dSScott Feldman EXPORT_SYMBOL_GPL(switchdev_port_attr_get);
2183094333dSScott Feldman 
2193094333dSScott Feldman static int __switchdev_port_attr_set(struct net_device *dev,
220f7fadf30SJiri Pirko 				     const struct switchdev_attr *attr,
2217ea6eb3fSJiri Pirko 				     struct switchdev_trans *trans)
2223094333dSScott Feldman {
2233094333dSScott Feldman 	const struct switchdev_ops *ops = dev->switchdev_ops;
2243094333dSScott Feldman 	struct net_device *lower_dev;
2253094333dSScott Feldman 	struct list_head *iter;
2263094333dSScott Feldman 	int err = -EOPNOTSUPP;
2273094333dSScott Feldman 
2280c63d80cSJiri Pirko 	if (ops && ops->switchdev_port_attr_set) {
2290c63d80cSJiri Pirko 		err = ops->switchdev_port_attr_set(dev, attr, trans);
2300c63d80cSJiri Pirko 		goto done;
2310c63d80cSJiri Pirko 	}
2323094333dSScott Feldman 
2333094333dSScott Feldman 	if (attr->flags & SWITCHDEV_F_NO_RECURSE)
234464314eaSScott Feldman 		goto done;
2353094333dSScott Feldman 
2363094333dSScott Feldman 	/* Switch device port(s) may be stacked under
2373094333dSScott Feldman 	 * bond/team/vlan dev, so recurse down to set attr on
2383094333dSScott Feldman 	 * each port.
2393094333dSScott Feldman 	 */
2403094333dSScott Feldman 
2413094333dSScott Feldman 	netdev_for_each_lower_dev(dev, lower_dev, iter) {
2427ea6eb3fSJiri Pirko 		err = __switchdev_port_attr_set(lower_dev, attr, trans);
2433094333dSScott Feldman 		if (err)
2443094333dSScott Feldman 			break;
2453094333dSScott Feldman 	}
2463094333dSScott Feldman 
247464314eaSScott Feldman done:
248464314eaSScott Feldman 	if (err == -EOPNOTSUPP && attr->flags & SWITCHDEV_F_SKIP_EOPNOTSUPP)
249464314eaSScott Feldman 		err = 0;
250464314eaSScott Feldman 
2513094333dSScott Feldman 	return err;
2523094333dSScott Feldman }
2533094333dSScott Feldman 
2540bc05d58SJiri Pirko static int switchdev_port_attr_set_now(struct net_device *dev,
255f7fadf30SJiri Pirko 				       const struct switchdev_attr *attr)
2563094333dSScott Feldman {
2577ea6eb3fSJiri Pirko 	struct switchdev_trans trans;
2583094333dSScott Feldman 	int err;
2593094333dSScott Feldman 
2607ea6eb3fSJiri Pirko 	switchdev_trans_init(&trans);
2617ea6eb3fSJiri Pirko 
2623094333dSScott Feldman 	/* Phase I: prepare for attr set. Driver/device should fail
2633094333dSScott Feldman 	 * here if there are going to be issues in the commit phase,
2643094333dSScott Feldman 	 * such as lack of resources or support.  The driver/device
2653094333dSScott Feldman 	 * should reserve resources needed for the commit phase here,
2663094333dSScott Feldman 	 * but should not commit the attr.
2673094333dSScott Feldman 	 */
2683094333dSScott Feldman 
269f623ab7fSJiri Pirko 	trans.ph_prepare = true;
2707ea6eb3fSJiri Pirko 	err = __switchdev_port_attr_set(dev, attr, &trans);
2713094333dSScott Feldman 	if (err) {
2723094333dSScott Feldman 		/* Prepare phase failed: abort the transaction.  Any
2733094333dSScott Feldman 		 * resources reserved in the prepare phase are
2743094333dSScott Feldman 		 * released.
2753094333dSScott Feldman 		 */
2763094333dSScott Feldman 
2779f6467cfSJiri Pirko 		if (err != -EOPNOTSUPP)
2787ea6eb3fSJiri Pirko 			switchdev_trans_items_destroy(&trans);
2793094333dSScott Feldman 
2803094333dSScott Feldman 		return err;
2813094333dSScott Feldman 	}
2823094333dSScott Feldman 
2833094333dSScott Feldman 	/* Phase II: commit attr set.  This cannot fail as a fault
2843094333dSScott Feldman 	 * of driver/device.  If it does, it's a bug in the driver/device
2853094333dSScott Feldman 	 * because the driver said everythings was OK in phase I.
2863094333dSScott Feldman 	 */
2873094333dSScott Feldman 
288f623ab7fSJiri Pirko 	trans.ph_prepare = false;
2897ea6eb3fSJiri Pirko 	err = __switchdev_port_attr_set(dev, attr, &trans);
290e9fdaec0SScott Feldman 	WARN(err, "%s: Commit of attribute (id=%d) failed.\n",
291e9fdaec0SScott Feldman 	     dev->name, attr->id);
2927ea6eb3fSJiri Pirko 	switchdev_trans_items_warn_destroy(dev, &trans);
2933094333dSScott Feldman 
2943094333dSScott Feldman 	return err;
2953094333dSScott Feldman }
2960bc05d58SJiri Pirko 
2970bc05d58SJiri Pirko static void switchdev_port_attr_set_deferred(struct net_device *dev,
2980bc05d58SJiri Pirko 					     const void *data)
2990bc05d58SJiri Pirko {
3000bc05d58SJiri Pirko 	const struct switchdev_attr *attr = data;
3010bc05d58SJiri Pirko 	int err;
3020bc05d58SJiri Pirko 
3030bc05d58SJiri Pirko 	err = switchdev_port_attr_set_now(dev, attr);
3040bc05d58SJiri Pirko 	if (err && err != -EOPNOTSUPP)
3050bc05d58SJiri Pirko 		netdev_err(dev, "failed (err=%d) to set attribute (id=%d)\n",
3060bc05d58SJiri Pirko 			   err, attr->id);
3077ceb2afbSElad Raz 	if (attr->complete)
3087ceb2afbSElad Raz 		attr->complete(dev, err, attr->complete_priv);
3090bc05d58SJiri Pirko }
3100bc05d58SJiri Pirko 
3110bc05d58SJiri Pirko static int switchdev_port_attr_set_defer(struct net_device *dev,
3120bc05d58SJiri Pirko 					 const struct switchdev_attr *attr)
3130bc05d58SJiri Pirko {
3140bc05d58SJiri Pirko 	return switchdev_deferred_enqueue(dev, attr, sizeof(*attr),
3150bc05d58SJiri Pirko 					  switchdev_port_attr_set_deferred);
3160bc05d58SJiri Pirko }
3170bc05d58SJiri Pirko 
3180bc05d58SJiri Pirko /**
3190bc05d58SJiri Pirko  *	switchdev_port_attr_set - Set port attribute
3200bc05d58SJiri Pirko  *
3210bc05d58SJiri Pirko  *	@dev: port device
3220bc05d58SJiri Pirko  *	@attr: attribute to set
3230bc05d58SJiri Pirko  *
3240bc05d58SJiri Pirko  *	Use a 2-phase prepare-commit transaction model to ensure
3250bc05d58SJiri Pirko  *	system is not left in a partially updated state due to
3260bc05d58SJiri Pirko  *	failure from driver/device.
3270bc05d58SJiri Pirko  *
3280bc05d58SJiri Pirko  *	rtnl_lock must be held and must not be in atomic section,
3290bc05d58SJiri Pirko  *	in case SWITCHDEV_F_DEFER flag is not set.
3300bc05d58SJiri Pirko  */
3310bc05d58SJiri Pirko int switchdev_port_attr_set(struct net_device *dev,
3320bc05d58SJiri Pirko 			    const struct switchdev_attr *attr)
3330bc05d58SJiri Pirko {
3340bc05d58SJiri Pirko 	if (attr->flags & SWITCHDEV_F_DEFER)
3350bc05d58SJiri Pirko 		return switchdev_port_attr_set_defer(dev, attr);
3360bc05d58SJiri Pirko 	ASSERT_RTNL();
3370bc05d58SJiri Pirko 	return switchdev_port_attr_set_now(dev, attr);
3380bc05d58SJiri Pirko }
3393094333dSScott Feldman EXPORT_SYMBOL_GPL(switchdev_port_attr_set);
3403094333dSScott Feldman 
341e258d919SScott Feldman static size_t switchdev_obj_size(const struct switchdev_obj *obj)
342e258d919SScott Feldman {
343e258d919SScott Feldman 	switch (obj->id) {
344e258d919SScott Feldman 	case SWITCHDEV_OBJ_ID_PORT_VLAN:
345e258d919SScott Feldman 		return sizeof(struct switchdev_obj_port_vlan);
3464d41e125SElad Raz 	case SWITCHDEV_OBJ_ID_PORT_MDB:
3474d41e125SElad Raz 		return sizeof(struct switchdev_obj_port_mdb);
348*47d5b6dbSAndrew Lunn 	case SWITCHDEV_OBJ_ID_HOST_MDB:
349*47d5b6dbSAndrew Lunn 		return sizeof(struct switchdev_obj_port_mdb);
350e258d919SScott Feldman 	default:
351e258d919SScott Feldman 		BUG();
352e258d919SScott Feldman 	}
353e258d919SScott Feldman 	return 0;
354e258d919SScott Feldman }
355e258d919SScott Feldman 
35622c1f67eSScott Feldman static int __switchdev_port_obj_add(struct net_device *dev,
357648b4a99SJiri Pirko 				    const struct switchdev_obj *obj,
3587ea6eb3fSJiri Pirko 				    struct switchdev_trans *trans)
359491d0f15SScott Feldman {
360491d0f15SScott Feldman 	const struct switchdev_ops *ops = dev->switchdev_ops;
361491d0f15SScott Feldman 	struct net_device *lower_dev;
362491d0f15SScott Feldman 	struct list_head *iter;
363491d0f15SScott Feldman 	int err = -EOPNOTSUPP;
364491d0f15SScott Feldman 
365491d0f15SScott Feldman 	if (ops && ops->switchdev_port_obj_add)
3669e8f4a54SJiri Pirko 		return ops->switchdev_port_obj_add(dev, obj, trans);
367491d0f15SScott Feldman 
368491d0f15SScott Feldman 	/* Switch device port(s) may be stacked under
369491d0f15SScott Feldman 	 * bond/team/vlan dev, so recurse down to add object on
370491d0f15SScott Feldman 	 * each port.
371491d0f15SScott Feldman 	 */
372491d0f15SScott Feldman 
373491d0f15SScott Feldman 	netdev_for_each_lower_dev(dev, lower_dev, iter) {
3749e8f4a54SJiri Pirko 		err = __switchdev_port_obj_add(lower_dev, obj, trans);
375491d0f15SScott Feldman 		if (err)
376491d0f15SScott Feldman 			break;
377491d0f15SScott Feldman 	}
378491d0f15SScott Feldman 
379491d0f15SScott Feldman 	return err;
380491d0f15SScott Feldman }
381491d0f15SScott Feldman 
3824d429c5dSJiri Pirko static int switchdev_port_obj_add_now(struct net_device *dev,
383648b4a99SJiri Pirko 				      const struct switchdev_obj *obj)
384491d0f15SScott Feldman {
3857ea6eb3fSJiri Pirko 	struct switchdev_trans trans;
386491d0f15SScott Feldman 	int err;
387491d0f15SScott Feldman 
388491d0f15SScott Feldman 	ASSERT_RTNL();
389491d0f15SScott Feldman 
3907ea6eb3fSJiri Pirko 	switchdev_trans_init(&trans);
3917ea6eb3fSJiri Pirko 
392491d0f15SScott Feldman 	/* Phase I: prepare for obj add. Driver/device should fail
393491d0f15SScott Feldman 	 * here if there are going to be issues in the commit phase,
394491d0f15SScott Feldman 	 * such as lack of resources or support.  The driver/device
395491d0f15SScott Feldman 	 * should reserve resources needed for the commit phase here,
396491d0f15SScott Feldman 	 * but should not commit the obj.
397491d0f15SScott Feldman 	 */
398491d0f15SScott Feldman 
399f623ab7fSJiri Pirko 	trans.ph_prepare = true;
4009e8f4a54SJiri Pirko 	err = __switchdev_port_obj_add(dev, obj, &trans);
401491d0f15SScott Feldman 	if (err) {
402491d0f15SScott Feldman 		/* Prepare phase failed: abort the transaction.  Any
403491d0f15SScott Feldman 		 * resources reserved in the prepare phase are
404491d0f15SScott Feldman 		 * released.
405491d0f15SScott Feldman 		 */
406491d0f15SScott Feldman 
4079f6467cfSJiri Pirko 		if (err != -EOPNOTSUPP)
4087ea6eb3fSJiri Pirko 			switchdev_trans_items_destroy(&trans);
409491d0f15SScott Feldman 
410491d0f15SScott Feldman 		return err;
411491d0f15SScott Feldman 	}
412491d0f15SScott Feldman 
413491d0f15SScott Feldman 	/* Phase II: commit obj add.  This cannot fail as a fault
414491d0f15SScott Feldman 	 * of driver/device.  If it does, it's a bug in the driver/device
415491d0f15SScott Feldman 	 * because the driver said everythings was OK in phase I.
416491d0f15SScott Feldman 	 */
417491d0f15SScott Feldman 
418f623ab7fSJiri Pirko 	trans.ph_prepare = false;
4199e8f4a54SJiri Pirko 	err = __switchdev_port_obj_add(dev, obj, &trans);
4209e8f4a54SJiri Pirko 	WARN(err, "%s: Commit of object (id=%d) failed.\n", dev->name, obj->id);
4217ea6eb3fSJiri Pirko 	switchdev_trans_items_warn_destroy(dev, &trans);
422491d0f15SScott Feldman 
423491d0f15SScott Feldman 	return err;
424491d0f15SScott Feldman }
4254d429c5dSJiri Pirko 
4264d429c5dSJiri Pirko static void switchdev_port_obj_add_deferred(struct net_device *dev,
4274d429c5dSJiri Pirko 					    const void *data)
4284d429c5dSJiri Pirko {
4294d429c5dSJiri Pirko 	const struct switchdev_obj *obj = data;
4304d429c5dSJiri Pirko 	int err;
4314d429c5dSJiri Pirko 
4324d429c5dSJiri Pirko 	err = switchdev_port_obj_add_now(dev, obj);
4334d429c5dSJiri Pirko 	if (err && err != -EOPNOTSUPP)
4344d429c5dSJiri Pirko 		netdev_err(dev, "failed (err=%d) to add object (id=%d)\n",
4354d429c5dSJiri Pirko 			   err, obj->id);
4367ceb2afbSElad Raz 	if (obj->complete)
4377ceb2afbSElad Raz 		obj->complete(dev, err, obj->complete_priv);
4384d429c5dSJiri Pirko }
4394d429c5dSJiri Pirko 
4404d429c5dSJiri Pirko static int switchdev_port_obj_add_defer(struct net_device *dev,
4414d429c5dSJiri Pirko 					const struct switchdev_obj *obj)
4424d429c5dSJiri Pirko {
443e258d919SScott Feldman 	return switchdev_deferred_enqueue(dev, obj, switchdev_obj_size(obj),
4444d429c5dSJiri Pirko 					  switchdev_port_obj_add_deferred);
4454d429c5dSJiri Pirko }
446491d0f15SScott Feldman 
447491d0f15SScott Feldman /**
4484d429c5dSJiri Pirko  *	switchdev_port_obj_add - Add port object
449491d0f15SScott Feldman  *
450491d0f15SScott Feldman  *	@dev: port device
451ab069002SVivien Didelot  *	@id: object ID
4524d429c5dSJiri Pirko  *	@obj: object to add
4534d429c5dSJiri Pirko  *
4544d429c5dSJiri Pirko  *	Use a 2-phase prepare-commit transaction model to ensure
4554d429c5dSJiri Pirko  *	system is not left in a partially updated state due to
4564d429c5dSJiri Pirko  *	failure from driver/device.
4574d429c5dSJiri Pirko  *
4584d429c5dSJiri Pirko  *	rtnl_lock must be held and must not be in atomic section,
4594d429c5dSJiri Pirko  *	in case SWITCHDEV_F_DEFER flag is not set.
460491d0f15SScott Feldman  */
4614d429c5dSJiri Pirko int switchdev_port_obj_add(struct net_device *dev,
4624d429c5dSJiri Pirko 			   const struct switchdev_obj *obj)
4634d429c5dSJiri Pirko {
4644d429c5dSJiri Pirko 	if (obj->flags & SWITCHDEV_F_DEFER)
4654d429c5dSJiri Pirko 		return switchdev_port_obj_add_defer(dev, obj);
4664d429c5dSJiri Pirko 	ASSERT_RTNL();
4674d429c5dSJiri Pirko 	return switchdev_port_obj_add_now(dev, obj);
4684d429c5dSJiri Pirko }
4694d429c5dSJiri Pirko EXPORT_SYMBOL_GPL(switchdev_port_obj_add);
4704d429c5dSJiri Pirko 
4714d429c5dSJiri Pirko static int switchdev_port_obj_del_now(struct net_device *dev,
472648b4a99SJiri Pirko 				      const struct switchdev_obj *obj)
473491d0f15SScott Feldman {
474491d0f15SScott Feldman 	const struct switchdev_ops *ops = dev->switchdev_ops;
475491d0f15SScott Feldman 	struct net_device *lower_dev;
476491d0f15SScott Feldman 	struct list_head *iter;
477491d0f15SScott Feldman 	int err = -EOPNOTSUPP;
478491d0f15SScott Feldman 
479491d0f15SScott Feldman 	if (ops && ops->switchdev_port_obj_del)
4809e8f4a54SJiri Pirko 		return ops->switchdev_port_obj_del(dev, obj);
481491d0f15SScott Feldman 
482491d0f15SScott Feldman 	/* Switch device port(s) may be stacked under
483491d0f15SScott Feldman 	 * bond/team/vlan dev, so recurse down to delete object on
484491d0f15SScott Feldman 	 * each port.
485491d0f15SScott Feldman 	 */
486491d0f15SScott Feldman 
487491d0f15SScott Feldman 	netdev_for_each_lower_dev(dev, lower_dev, iter) {
4884d429c5dSJiri Pirko 		err = switchdev_port_obj_del_now(lower_dev, obj);
489491d0f15SScott Feldman 		if (err)
490491d0f15SScott Feldman 			break;
491491d0f15SScott Feldman 	}
492491d0f15SScott Feldman 
493491d0f15SScott Feldman 	return err;
494491d0f15SScott Feldman }
4954d429c5dSJiri Pirko 
4964d429c5dSJiri Pirko static void switchdev_port_obj_del_deferred(struct net_device *dev,
4974d429c5dSJiri Pirko 					    const void *data)
4984d429c5dSJiri Pirko {
4994d429c5dSJiri Pirko 	const struct switchdev_obj *obj = data;
5004d429c5dSJiri Pirko 	int err;
5014d429c5dSJiri Pirko 
5024d429c5dSJiri Pirko 	err = switchdev_port_obj_del_now(dev, obj);
5034d429c5dSJiri Pirko 	if (err && err != -EOPNOTSUPP)
5044d429c5dSJiri Pirko 		netdev_err(dev, "failed (err=%d) to del object (id=%d)\n",
5054d429c5dSJiri Pirko 			   err, obj->id);
5067ceb2afbSElad Raz 	if (obj->complete)
5077ceb2afbSElad Raz 		obj->complete(dev, err, obj->complete_priv);
5084d429c5dSJiri Pirko }
5094d429c5dSJiri Pirko 
5104d429c5dSJiri Pirko static int switchdev_port_obj_del_defer(struct net_device *dev,
5114d429c5dSJiri Pirko 					const struct switchdev_obj *obj)
5124d429c5dSJiri Pirko {
513e258d919SScott Feldman 	return switchdev_deferred_enqueue(dev, obj, switchdev_obj_size(obj),
5144d429c5dSJiri Pirko 					  switchdev_port_obj_del_deferred);
5154d429c5dSJiri Pirko }
5164d429c5dSJiri Pirko 
5174d429c5dSJiri Pirko /**
5184d429c5dSJiri Pirko  *	switchdev_port_obj_del - Delete port object
5194d429c5dSJiri Pirko  *
5204d429c5dSJiri Pirko  *	@dev: port device
5214d429c5dSJiri Pirko  *	@id: object ID
5224d429c5dSJiri Pirko  *	@obj: object to delete
5234d429c5dSJiri Pirko  *
5244d429c5dSJiri Pirko  *	rtnl_lock must be held and must not be in atomic section,
5254d429c5dSJiri Pirko  *	in case SWITCHDEV_F_DEFER flag is not set.
5264d429c5dSJiri Pirko  */
5274d429c5dSJiri Pirko int switchdev_port_obj_del(struct net_device *dev,
5284d429c5dSJiri Pirko 			   const struct switchdev_obj *obj)
5294d429c5dSJiri Pirko {
5304d429c5dSJiri Pirko 	if (obj->flags & SWITCHDEV_F_DEFER)
5314d429c5dSJiri Pirko 		return switchdev_port_obj_del_defer(dev, obj);
5324d429c5dSJiri Pirko 	ASSERT_RTNL();
5334d429c5dSJiri Pirko 	return switchdev_port_obj_del_now(dev, obj);
5344d429c5dSJiri Pirko }
535491d0f15SScott Feldman EXPORT_SYMBOL_GPL(switchdev_port_obj_del);
536491d0f15SScott Feldman 
537ff5cf100SArkadi Sharshevsky static ATOMIC_NOTIFIER_HEAD(switchdev_notif_chain);
53803bf0c28SJiri Pirko 
53903bf0c28SJiri Pirko /**
540ebb9a03aSJiri Pirko  *	register_switchdev_notifier - Register notifier
54103bf0c28SJiri Pirko  *	@nb: notifier_block
54203bf0c28SJiri Pirko  *
543ff5cf100SArkadi Sharshevsky  *	Register switch device notifier.
54403bf0c28SJiri Pirko  */
545ebb9a03aSJiri Pirko int register_switchdev_notifier(struct notifier_block *nb)
54603bf0c28SJiri Pirko {
547ff5cf100SArkadi Sharshevsky 	return atomic_notifier_chain_register(&switchdev_notif_chain, nb);
54803bf0c28SJiri Pirko }
549ebb9a03aSJiri Pirko EXPORT_SYMBOL_GPL(register_switchdev_notifier);
55003bf0c28SJiri Pirko 
55103bf0c28SJiri Pirko /**
552ebb9a03aSJiri Pirko  *	unregister_switchdev_notifier - Unregister notifier
55303bf0c28SJiri Pirko  *	@nb: notifier_block
55403bf0c28SJiri Pirko  *
55503bf0c28SJiri Pirko  *	Unregister switch device notifier.
55603bf0c28SJiri Pirko  */
557ebb9a03aSJiri Pirko int unregister_switchdev_notifier(struct notifier_block *nb)
55803bf0c28SJiri Pirko {
559ff5cf100SArkadi Sharshevsky 	return atomic_notifier_chain_unregister(&switchdev_notif_chain, nb);
56003bf0c28SJiri Pirko }
561ebb9a03aSJiri Pirko EXPORT_SYMBOL_GPL(unregister_switchdev_notifier);
56203bf0c28SJiri Pirko 
56303bf0c28SJiri Pirko /**
564ebb9a03aSJiri Pirko  *	call_switchdev_notifiers - Call notifiers
56503bf0c28SJiri Pirko  *	@val: value passed unmodified to notifier function
56603bf0c28SJiri Pirko  *	@dev: port device
56703bf0c28SJiri Pirko  *	@info: notifier information data
56803bf0c28SJiri Pirko  *
569ff5cf100SArkadi Sharshevsky  *	Call all network notifier blocks.
57003bf0c28SJiri Pirko  */
571ebb9a03aSJiri Pirko int call_switchdev_notifiers(unsigned long val, struct net_device *dev,
572ebb9a03aSJiri Pirko 			     struct switchdev_notifier_info *info)
57303bf0c28SJiri Pirko {
57403bf0c28SJiri Pirko 	info->dev = dev;
575ff5cf100SArkadi Sharshevsky 	return atomic_notifier_call_chain(&switchdev_notif_chain, val, info);
57603bf0c28SJiri Pirko }
577ebb9a03aSJiri Pirko EXPORT_SYMBOL_GPL(call_switchdev_notifiers);
5788a44dbb2SRoopa Prabhu 
5798438884dSOr Gerlitz bool switchdev_port_same_parent_id(struct net_device *a,
5801a3b2ec9SScott Feldman 				   struct net_device *b)
5811a3b2ec9SScott Feldman {
5821a3b2ec9SScott Feldman 	struct switchdev_attr a_attr = {
5836ff64f6fSIdo Schimmel 		.orig_dev = a,
5841f868398SJiri Pirko 		.id = SWITCHDEV_ATTR_ID_PORT_PARENT_ID,
5851a3b2ec9SScott Feldman 	};
5861a3b2ec9SScott Feldman 	struct switchdev_attr b_attr = {
5876ff64f6fSIdo Schimmel 		.orig_dev = b,
5881f868398SJiri Pirko 		.id = SWITCHDEV_ATTR_ID_PORT_PARENT_ID,
5891a3b2ec9SScott Feldman 	};
5901a3b2ec9SScott Feldman 
5911a3b2ec9SScott Feldman 	if (switchdev_port_attr_get(a, &a_attr) ||
5921a3b2ec9SScott Feldman 	    switchdev_port_attr_get(b, &b_attr))
5931a3b2ec9SScott Feldman 		return false;
5941a3b2ec9SScott Feldman 
5951a3b2ec9SScott Feldman 	return netdev_phys_item_id_same(&a_attr.u.ppid, &b_attr.u.ppid);
5961a3b2ec9SScott Feldman }
5972eb03e6cSOr Gerlitz EXPORT_SYMBOL_GPL(switchdev_port_same_parent_id);
598