mirror of
https://github.com/tbsdtv/linux_media.git
synced 2025-07-23 04:33:26 +02:00
The call path of a switchdev VLAN addition to the bridge looks something like this today: nbp_vlan_init | __br_vlan_set_default_pvid | | | | | br_afspec | | | | | | | v | | | br_process_vlan_info | | | | | | | v | | | br_vlan_info | | | / \ / | | / \ / | | / \ / | | / \ / v v v v v nbp_vlan_add br_vlan_add ------+ | ^ ^ | | | / | | | | / / / | \ br_vlan_get_master/ / v \ ^ / / br_vlan_add_existing \ | / / | \ | / / / \ | / / / \ | / / / \ | / / / v | | v / __vlan_add / / | / / | / v | / __vlan_vid_add | / \ | / v v v br_switchdev_port_vlan_add The ranges UAPI was introduced to the bridge in commit bdced7ef78
("bridge: support for multiple vlans and vlan ranges in setlink and dellink requests") (Jan 10 2015). But the VLAN ranges (parsed in br_afspec) have always been passed one by one, through struct bridge_vlan_info tmp_vinfo, to br_vlan_info. So the range never went too far in depth. Then Scott Feldman introduced the switchdev_port_bridge_setlink function in commit 47f8328bb1
("switchdev: add new switchdev bridge setlink"). That marked the introduction of the SWITCHDEV_OBJ_PORT_VLAN, which made full use of the range. But switchdev_port_bridge_setlink was called like this: br_setlink -> br_afspec -> switchdev_port_bridge_setlink Basically, the switchdev and the bridge code were not tightly integrated. Then commit 41c498b935
("bridge: restore br_setlink back to original") came, and switchdev drivers were required to implement .ndo_bridge_setlink = switchdev_port_bridge_setlink for a while. In the meantime, commits such as 0944d6b5a2
("bridge: try switchdev op first in __vlan_vid_add/del") finally made switchdev penetrate the br_vlan_info() barrier and start to develop the call path we have today. But remember, br_vlan_info() still receives VLANs one by one. Then Arkadi Sharshevsky refactored the switchdev API in 2017 in commit 29ab586c3d
("net: switchdev: Remove bridge bypass support from switchdev") so that drivers would not implement .ndo_bridge_setlink any longer. The switchdev_port_bridge_setlink also got deleted. This refactoring removed the parallel bridge_setlink implementation from switchdev, and left the only switchdev VLAN objects to be the ones offloaded from __vlan_vid_add (basically RX filtering) and __vlan_add (the latter coming from commit 9c86ce2c1a
("net: bridge: Notify about bridge VLANs")). That is to say, today the switchdev VLAN object ranges are not used in the kernel. Refactoring the above call path is a bit complicated, when the bridge VLAN call path is already a bit complicated. Let's go off and finish the job of commit 29ab586c3d
by deleting the bogus iteration through the VLAN ranges from the drivers. Some aspects of this feature never made too much sense in the first place. For example, what is a range of VLANs all having the BRIDGE_VLAN_INFO_PVID flag supposed to mean, when a port can obviously have a single pvid? This particular configuration _is_ denied as of commit 6623c60dc2
("bridge: vlan: enforce no pvid flag in vlan ranges"), but from an API perspective, the driver still has to play pretend, and only offload the vlan->vid_end as pvid. And the addition of a switchdev VLAN object can modify the flags of another, completely unrelated, switchdev VLAN object! (a VLAN that is PVID will invalidate the PVID flag from whatever other VLAN had previously been offloaded with switchdev and had that flag. Yet switchdev never notifies about that change, drivers are supposed to guess). Nonetheless, having a VLAN range in the API makes error handling look scarier than it really is - unwinding on errors and all of that. When in reality, no one really calls this API with more than one VLAN. It is all unnecessary complexity. And despite appearing pretentious (two-phase transactional model and all), the switchdev API is really sloppy because the VLAN addition and removal operations are not paired with one another (you can add a VLAN 100 times and delete it just once). The bridge notifies through switchdev of a VLAN addition not only when the flags of an existing VLAN change, but also when nothing changes. There are switchdev drivers out there who don't like adding a VLAN that has already been added, and those checks don't really belong at driver level. But the fact that the API contains ranges is yet another factor that prevents this from being addressed in the future. Of the existing switchdev pieces of hardware, it appears that only Mellanox Spectrum supports offloading more than one VLAN at a time, through mlxsw_sp_port_vlan_set. I have kept that code internal to the driver, because there is some more bookkeeping that makes use of it, but I deleted it from the switchdev API. But since the switchdev support for ranges has already been de facto deleted by a Mellanox employee and nobody noticed for 4 years, I'm going to assume it's not a biggie. 
Signed-off-by: Vladimir Oltean <vladimir.oltean@nxp.com> Reviewed-by: Ido Schimmel <idosch@nvidia.com> # switchdev and mlxsw Reviewed-by: Florian Fainelli <f.fainelli@gmail.com> Reviewed-by: Kurt Kanzenbach <kurt@linutronix.de> # hellcreek Signed-off-by: Jakub Kicinski <kuba@kernel.org>
404 lines
10 KiB
C
404 lines
10 KiB
C
/* SPDX-License-Identifier: GPL-2.0-or-later */
|
|
/*
|
|
* include/net/switchdev.h - Switch device API
|
|
* Copyright (c) 2014-2015 Jiri Pirko <jiri@resnulli.us>
|
|
* Copyright (c) 2014-2015 Scott Feldman <sfeldma@gmail.com>
|
|
*/
|
|
#ifndef _LINUX_SWITCHDEV_H_
|
|
#define _LINUX_SWITCHDEV_H_
|
|
|
|
#include <linux/netdevice.h>
|
|
#include <linux/notifier.h>
|
|
#include <linux/list.h>
|
|
#include <net/ip_fib.h>
|
|
|
|
#define SWITCHDEV_F_NO_RECURSE BIT(0)
|
|
#define SWITCHDEV_F_SKIP_EOPNOTSUPP BIT(1)
|
|
#define SWITCHDEV_F_DEFER BIT(2)
|
|
|
|
/* Transaction context passed to switchdev callbacks. */
struct switchdev_trans {
	bool ph_prepare;	/* set for the prepare phase, clear for commit */
};

/*
 * Tell whether @trans denotes the prepare phase.
 *
 * Returns true only when @trans is non-NULL and its ph_prepare flag is set;
 * a NULL @trans is neither "prepare" nor "commit".
 */
static inline bool switchdev_trans_ph_prepare(struct switchdev_trans *trans)
{
	return trans && trans->ph_prepare;
}

/*
 * Tell whether @trans denotes the commit phase.
 *
 * Returns true only when @trans is non-NULL and its ph_prepare flag is clear.
 */
static inline bool switchdev_trans_ph_commit(struct switchdev_trans *trans)
{
	return trans && !trans->ph_prepare;
}
|
|
|
|
/*
 * Identifiers of the attributes that can be carried by a
 * struct switchdev_attr. The MRP identifiers are only present when
 * CONFIG_BRIDGE_MRP is enabled.
 */
enum switchdev_attr_id {
	SWITCHDEV_ATTR_ID_UNDEFINED,
	SWITCHDEV_ATTR_ID_PORT_STP_STATE,
	SWITCHDEV_ATTR_ID_PORT_BRIDGE_FLAGS,
	SWITCHDEV_ATTR_ID_PORT_PRE_BRIDGE_FLAGS,
	SWITCHDEV_ATTR_ID_PORT_MROUTER,
	SWITCHDEV_ATTR_ID_BRIDGE_AGEING_TIME,
	SWITCHDEV_ATTR_ID_BRIDGE_VLAN_FILTERING,
	SWITCHDEV_ATTR_ID_BRIDGE_VLAN_PROTOCOL,
	SWITCHDEV_ATTR_ID_BRIDGE_MC_DISABLED,
	SWITCHDEV_ATTR_ID_BRIDGE_MROUTER,
#if IS_ENABLED(CONFIG_BRIDGE_MRP)
	SWITCHDEV_ATTR_ID_MRP_PORT_STATE,
	SWITCHDEV_ATTR_ID_MRP_PORT_ROLE,
#endif
};
|
|
|
|
struct switchdev_attr {
|
|
struct net_device *orig_dev;
|
|
enum switchdev_attr_id id;
|
|
u32 flags;
|
|
void *complete_priv;
|
|
void (*complete)(struct net_device *dev, int err, void *priv);
|
|
union {
|
|
u8 stp_state; /* PORT_STP_STATE */
|
|
unsigned long brport_flags; /* PORT_{PRE}_BRIDGE_FLAGS */
|
|
bool mrouter; /* PORT_MROUTER */
|
|
clock_t ageing_time; /* BRIDGE_AGEING_TIME */
|
|
bool vlan_filtering; /* BRIDGE_VLAN_FILTERING */
|
|
u16 vlan_protocol; /* BRIDGE_VLAN_PROTOCOL */
|
|
bool mc_disabled; /* MC_DISABLED */
|
|
#if IS_ENABLED(CONFIG_BRIDGE_MRP)
|
|
u8 mrp_port_state; /* MRP_PORT_STATE */
|
|
u8 mrp_port_role; /* MRP_PORT_ROLE */
|
|
#endif
|
|
} u;
|
|
};
|
|
|
|
/*
 * Identifiers of the object kinds that embed a struct switchdev_obj.
 * The MRP identifiers are only present when CONFIG_BRIDGE_MRP is enabled.
 */
enum switchdev_obj_id {
	SWITCHDEV_OBJ_ID_UNDEFINED,
	SWITCHDEV_OBJ_ID_PORT_VLAN,
	SWITCHDEV_OBJ_ID_PORT_MDB,
	SWITCHDEV_OBJ_ID_HOST_MDB,
#if IS_ENABLED(CONFIG_BRIDGE_MRP)
	SWITCHDEV_OBJ_ID_MRP,
	SWITCHDEV_OBJ_ID_RING_TEST_MRP,
	SWITCHDEV_OBJ_ID_RING_ROLE_MRP,
	SWITCHDEV_OBJ_ID_RING_STATE_MRP,
	SWITCHDEV_OBJ_ID_IN_TEST_MRP,
	SWITCHDEV_OBJ_ID_IN_ROLE_MRP,
	SWITCHDEV_OBJ_ID_IN_STATE_MRP,
#endif
};
|
|
|
|
struct switchdev_obj {
|
|
struct net_device *orig_dev;
|
|
enum switchdev_obj_id id;
|
|
u32 flags;
|
|
void *complete_priv;
|
|
void (*complete)(struct net_device *dev, int err, void *priv);
|
|
};
|
|
|
|
/* SWITCHDEV_OBJ_ID_PORT_VLAN */
|
|
struct switchdev_obj_port_vlan {
|
|
struct switchdev_obj obj;
|
|
u16 flags;
|
|
u16 vid;
|
|
};
|
|
|
|
#define SWITCHDEV_OBJ_PORT_VLAN(OBJ) \
|
|
container_of((OBJ), struct switchdev_obj_port_vlan, obj)
|
|
|
|
/* SWITCHDEV_OBJ_ID_PORT_MDB */
|
|
struct switchdev_obj_port_mdb {
|
|
struct switchdev_obj obj;
|
|
unsigned char addr[ETH_ALEN];
|
|
u16 vid;
|
|
};
|
|
|
|
#define SWITCHDEV_OBJ_PORT_MDB(OBJ) \
|
|
container_of((OBJ), struct switchdev_obj_port_mdb, obj)
|
|
|
|
|
|
#if IS_ENABLED(CONFIG_BRIDGE_MRP)
|
|
/* SWITCHDEV_OBJ_ID_MRP */
|
|
struct switchdev_obj_mrp {
|
|
struct switchdev_obj obj;
|
|
struct net_device *p_port;
|
|
struct net_device *s_port;
|
|
u32 ring_id;
|
|
u16 prio;
|
|
};
|
|
|
|
#define SWITCHDEV_OBJ_MRP(OBJ) \
|
|
container_of((OBJ), struct switchdev_obj_mrp, obj)
|
|
|
|
/* SWITCHDEV_OBJ_ID_RING_TEST_MRP */
|
|
struct switchdev_obj_ring_test_mrp {
|
|
struct switchdev_obj obj;
|
|
/* The value is in us and a value of 0 represents to stop */
|
|
u32 interval;
|
|
u8 max_miss;
|
|
u32 ring_id;
|
|
u32 period;
|
|
bool monitor;
|
|
};
|
|
|
|
#define SWITCHDEV_OBJ_RING_TEST_MRP(OBJ) \
|
|
container_of((OBJ), struct switchdev_obj_ring_test_mrp, obj)
|
|
|
|
/* SWICHDEV_OBJ_ID_RING_ROLE_MRP */
|
|
struct switchdev_obj_ring_role_mrp {
|
|
struct switchdev_obj obj;
|
|
u8 ring_role;
|
|
u32 ring_id;
|
|
};
|
|
|
|
#define SWITCHDEV_OBJ_RING_ROLE_MRP(OBJ) \
|
|
container_of((OBJ), struct switchdev_obj_ring_role_mrp, obj)
|
|
|
|
struct switchdev_obj_ring_state_mrp {
|
|
struct switchdev_obj obj;
|
|
u8 ring_state;
|
|
u32 ring_id;
|
|
};
|
|
|
|
#define SWITCHDEV_OBJ_RING_STATE_MRP(OBJ) \
|
|
container_of((OBJ), struct switchdev_obj_ring_state_mrp, obj)
|
|
|
|
/* SWITCHDEV_OBJ_ID_IN_TEST_MRP */
|
|
struct switchdev_obj_in_test_mrp {
|
|
struct switchdev_obj obj;
|
|
/* The value is in us and a value of 0 represents to stop */
|
|
u32 interval;
|
|
u32 in_id;
|
|
u32 period;
|
|
u8 max_miss;
|
|
};
|
|
|
|
#define SWITCHDEV_OBJ_IN_TEST_MRP(OBJ) \
|
|
container_of((OBJ), struct switchdev_obj_in_test_mrp, obj)
|
|
|
|
/* SWICHDEV_OBJ_ID_IN_ROLE_MRP */
|
|
struct switchdev_obj_in_role_mrp {
|
|
struct switchdev_obj obj;
|
|
struct net_device *i_port;
|
|
u32 ring_id;
|
|
u16 in_id;
|
|
u8 in_role;
|
|
};
|
|
|
|
#define SWITCHDEV_OBJ_IN_ROLE_MRP(OBJ) \
|
|
container_of((OBJ), struct switchdev_obj_in_role_mrp, obj)
|
|
|
|
struct switchdev_obj_in_state_mrp {
|
|
struct switchdev_obj obj;
|
|
u32 in_id;
|
|
u8 in_state;
|
|
};
|
|
|
|
#define SWITCHDEV_OBJ_IN_STATE_MRP(OBJ) \
|
|
container_of((OBJ), struct switchdev_obj_in_state_mrp, obj)
|
|
|
|
#endif
|
|
|
|
/* Function type: callback taking a switchdev object and returning an int status. */
typedef int switchdev_obj_dump_cb_t(struct switchdev_obj *obj);
|
|
|
|
/*
 * Event codes passed as the 'val' argument of the switchdev notifier
 * chains. Numbering starts at 1.
 */
enum switchdev_notifier_type {
	SWITCHDEV_FDB_ADD_TO_BRIDGE = 1,
	SWITCHDEV_FDB_DEL_TO_BRIDGE,
	SWITCHDEV_FDB_ADD_TO_DEVICE,
	SWITCHDEV_FDB_DEL_TO_DEVICE,
	SWITCHDEV_FDB_OFFLOADED,
	SWITCHDEV_FDB_FLUSH_TO_BRIDGE,

	SWITCHDEV_PORT_OBJ_ADD, /* Blocking. */
	SWITCHDEV_PORT_OBJ_DEL, /* Blocking. */
	SWITCHDEV_PORT_ATTR_SET, /* May be blocking. */

	SWITCHDEV_VXLAN_FDB_ADD_TO_BRIDGE,
	SWITCHDEV_VXLAN_FDB_DEL_TO_BRIDGE,
	SWITCHDEV_VXLAN_FDB_ADD_TO_DEVICE,
	SWITCHDEV_VXLAN_FDB_DEL_TO_DEVICE,
	SWITCHDEV_VXLAN_FDB_OFFLOADED,
};
|
|
|
|
/*
 * Common header of every switchdev notification payload: the device the
 * event concerns and an extended-ack pointer.
 */
struct switchdev_notifier_info {
	struct net_device *dev;
	struct netlink_ext_ack *extack;
};
|
|
|
|
struct switchdev_notifier_fdb_info {
|
|
struct switchdev_notifier_info info; /* must be first */
|
|
const unsigned char *addr;
|
|
u16 vid;
|
|
u8 added_by_user:1,
|
|
offloaded:1;
|
|
};
|
|
|
|
struct switchdev_notifier_port_obj_info {
|
|
struct switchdev_notifier_info info; /* must be first */
|
|
const struct switchdev_obj *obj;
|
|
struct switchdev_trans *trans;
|
|
bool handled;
|
|
};
|
|
|
|
struct switchdev_notifier_port_attr_info {
|
|
struct switchdev_notifier_info info; /* must be first */
|
|
const struct switchdev_attr *attr;
|
|
struct switchdev_trans *trans;
|
|
bool handled;
|
|
};
|
|
|
|
static inline struct net_device *
|
|
switchdev_notifier_info_to_dev(const struct switchdev_notifier_info *info)
|
|
{
|
|
return info->dev;
|
|
}
|
|
|
|
static inline struct netlink_ext_ack *
|
|
switchdev_notifier_info_to_extack(const struct switchdev_notifier_info *info)
|
|
{
|
|
return info->extack;
|
|
}
|
|
|
|
#ifdef CONFIG_NET_SWITCHDEV
|
|
|
|
/* Entry points available when CONFIG_NET_SWITCHDEV is set. */
void switchdev_deferred_process(void);
int switchdev_port_attr_set(struct net_device *dev,
			    const struct switchdev_attr *attr);
int switchdev_port_obj_add(struct net_device *dev,
			   const struct switchdev_obj *obj,
			   struct netlink_ext_ack *extack);
int switchdev_port_obj_del(struct net_device *dev,
			   const struct switchdev_obj *obj);

/* Notifier chain registration and invocation. */
int register_switchdev_notifier(struct notifier_block *nb);
int unregister_switchdev_notifier(struct notifier_block *nb);
int call_switchdev_notifiers(unsigned long val, struct net_device *dev,
			     struct switchdev_notifier_info *info,
			     struct netlink_ext_ack *extack);

/* Blocking notifier chain registration and invocation. */
int register_switchdev_blocking_notifier(struct notifier_block *nb);
int unregister_switchdev_blocking_notifier(struct notifier_block *nb);
int call_switchdev_blocking_notifiers(unsigned long val, struct net_device *dev,
				      struct switchdev_notifier_info *info,
				      struct netlink_ext_ack *extack);

/*
 * NOTE(review): no !CONFIG_NET_SWITCHDEV stub exists for this declaration
 * in this header - confirm it still has a definition and callers.
 */
void switchdev_port_fwd_mark_set(struct net_device *dev,
				 struct net_device *group_dev,
				 bool joining);

/*
 * Helpers taking a notification payload plus driver callbacks:
 * @check_cb is a predicate on a net_device, and @add_cb / @del_cb /
 * @set_cb perform the actual operation on the device.
 */
int switchdev_handle_port_obj_add(struct net_device *dev,
			struct switchdev_notifier_port_obj_info *port_obj_info,
			bool (*check_cb)(const struct net_device *dev),
			int (*add_cb)(struct net_device *dev,
				      const struct switchdev_obj *obj,
				      struct switchdev_trans *trans,
				      struct netlink_ext_ack *extack));
int switchdev_handle_port_obj_del(struct net_device *dev,
			struct switchdev_notifier_port_obj_info *port_obj_info,
			bool (*check_cb)(const struct net_device *dev),
			int (*del_cb)(struct net_device *dev,
				      const struct switchdev_obj *obj));

int switchdev_handle_port_attr_set(struct net_device *dev,
			struct switchdev_notifier_port_attr_info *port_attr_info,
			bool (*check_cb)(const struct net_device *dev),
			int (*set_cb)(struct net_device *dev,
				      const struct switchdev_attr *attr,
				      struct switchdev_trans *trans));
|
|
#else
|
|
|
|
/* Stub for !CONFIG_NET_SWITCHDEV: nothing to do. */
static inline void switchdev_deferred_process(void)
{
}
|
|
|
|
/* Stub for !CONFIG_NET_SWITCHDEV: always reports -EOPNOTSUPP. */
static inline int switchdev_port_attr_set(struct net_device *dev,
					  const struct switchdev_attr *attr)
{
	return -EOPNOTSUPP;
}
|
|
|
|
/* Stub for !CONFIG_NET_SWITCHDEV: always reports -EOPNOTSUPP. */
static inline int switchdev_port_obj_add(struct net_device *dev,
					 const struct switchdev_obj *obj,
					 struct netlink_ext_ack *extack)
{
	return -EOPNOTSUPP;
}
|
|
|
|
/* Stub for !CONFIG_NET_SWITCHDEV: always reports -EOPNOTSUPP. */
static inline int switchdev_port_obj_del(struct net_device *dev,
					 const struct switchdev_obj *obj)
{
	return -EOPNOTSUPP;
}
|
|
|
|
/* Stub for !CONFIG_NET_SWITCHDEV: @nb is ignored and 0 is returned. */
static inline int register_switchdev_notifier(struct notifier_block *nb)
{
	return 0;
}
|
|
|
|
/* Stub for !CONFIG_NET_SWITCHDEV: @nb is ignored and 0 is returned. */
static inline int unregister_switchdev_notifier(struct notifier_block *nb)
{
	return 0;
}
|
|
|
|
static inline int call_switchdev_notifiers(unsigned long val,
|
|
struct net_device *dev,
|
|
struct switchdev_notifier_info *info,
|
|
struct netlink_ext_ack *extack)
|
|
{
|
|
return NOTIFY_DONE;
|
|
}
|
|
|
|
/* Stub for !CONFIG_NET_SWITCHDEV: @nb is ignored and 0 is returned. */
static inline int
register_switchdev_blocking_notifier(struct notifier_block *nb)
{
	return 0;
}
|
|
|
|
/* Stub for !CONFIG_NET_SWITCHDEV: @nb is ignored and 0 is returned. */
static inline int
unregister_switchdev_blocking_notifier(struct notifier_block *nb)
{
	return 0;
}
|
|
|
|
static inline int
|
|
call_switchdev_blocking_notifiers(unsigned long val,
|
|
struct net_device *dev,
|
|
struct switchdev_notifier_info *info,
|
|
struct netlink_ext_ack *extack)
|
|
{
|
|
return NOTIFY_DONE;
|
|
}
|
|
|
|
/*
 * Stub for !CONFIG_NET_SWITCHDEV: neither callback is invoked and 0 is
 * returned.
 */
static inline int
switchdev_handle_port_obj_add(struct net_device *dev,
			struct switchdev_notifier_port_obj_info *port_obj_info,
			bool (*check_cb)(const struct net_device *dev),
			int (*add_cb)(struct net_device *dev,
				      const struct switchdev_obj *obj,
				      struct switchdev_trans *trans,
				      struct netlink_ext_ack *extack))
{
	return 0;
}
|
|
|
|
/*
 * Stub for !CONFIG_NET_SWITCHDEV: neither callback is invoked and 0 is
 * returned.
 */
static inline int
switchdev_handle_port_obj_del(struct net_device *dev,
			struct switchdev_notifier_port_obj_info *port_obj_info,
			bool (*check_cb)(const struct net_device *dev),
			int (*del_cb)(struct net_device *dev,
				      const struct switchdev_obj *obj))
{
	return 0;
}
|
|
|
|
/*
 * Stub for !CONFIG_NET_SWITCHDEV: neither callback is invoked and 0 is
 * returned.
 */
static inline int
switchdev_handle_port_attr_set(struct net_device *dev,
			struct switchdev_notifier_port_attr_info *port_attr_info,
			bool (*check_cb)(const struct net_device *dev),
			int (*set_cb)(struct net_device *dev,
				      const struct switchdev_attr *attr,
				      struct switchdev_trans *trans))
{
	return 0;
}
|
|
#endif
|
|
|
|
#endif /* _LINUX_SWITCHDEV_H_ */
|