root/drivers/net/ethernet/mellanox/mlx5/core/en/rep/bridge.c
// SPDX-License-Identifier: GPL-2.0 OR Linux-OpenIB
/* Copyright (c) 2021 Mellanox Technologies. */

#include <linux/netdevice.h>
#include <linux/if_bridge.h>
#include <net/netevent.h>
#include <net/switchdev.h>
#include "bridge.h"
#include "esw/bridge.h"
#include "en_rep.h"

#define MLX5_ESW_BRIDGE_UPDATE_INTERVAL 1000

struct mlx5_bridge_switchdev_fdb_work {
        struct work_struct work;
        struct switchdev_notifier_fdb_info fdb_info;
        struct net_device *dev;
        struct mlx5_esw_bridge_offloads *br_offloads;
        bool add;
};

static bool mlx5_esw_bridge_dev_same_esw(struct net_device *dev, struct mlx5_eswitch *esw)
{
        struct mlx5e_priv *priv = netdev_priv(dev);

        return esw == priv->mdev->priv.eswitch;
}

static bool mlx5_esw_bridge_dev_same_hw(struct net_device *dev, struct mlx5_eswitch *esw)
{
        struct mlx5e_priv *priv = netdev_priv(dev);
        struct mlx5_core_dev *mdev, *esw_mdev;

        mdev = priv->mdev;
        esw_mdev = esw->dev;

        return mlx5_same_hw_devs(mdev, esw_mdev);
}

static struct net_device *
mlx5_esw_bridge_lag_rep_get(struct net_device *dev, struct mlx5_eswitch *esw)
{
        struct net_device *lower;
        struct list_head *iter;

        netdev_for_each_lower_dev(dev, lower, iter) {
                if (!mlx5e_eswitch_rep(lower))
                        continue;

                if (mlx5_esw_bridge_dev_same_esw(lower, esw))
                        return lower;
        }

        return NULL;
}

static struct net_device *
mlx5_esw_bridge_rep_vport_num_vhca_id_get(struct net_device *dev, struct mlx5_eswitch *esw,
                                          u16 *vport_num, u16 *esw_owner_vhca_id)
{
        struct mlx5e_rep_priv *rpriv;
        struct mlx5e_priv *priv;

        if (netif_is_lag_master(dev))
                dev = mlx5_esw_bridge_lag_rep_get(dev, esw);

        if (!dev || !mlx5e_eswitch_rep(dev) || !mlx5_esw_bridge_dev_same_hw(dev, esw))
                return NULL;

        priv = netdev_priv(dev);

        if (!priv->mdev->priv.eswitch->br_offloads)
                return NULL;

        rpriv = priv->ppriv;
        *vport_num = rpriv->rep->vport;
        *esw_owner_vhca_id = MLX5_CAP_GEN(priv->mdev, vhca_id);
        return dev;
}

static struct net_device *
mlx5_esw_bridge_lower_rep_vport_num_vhca_id_get(struct net_device *dev, struct mlx5_eswitch *esw,
                                                u16 *vport_num, u16 *esw_owner_vhca_id)
{
        struct net_device *lower_dev;
        struct list_head *iter;

        if (netif_is_lag_master(dev) || mlx5e_eswitch_rep(dev))
                return mlx5_esw_bridge_rep_vport_num_vhca_id_get(dev, esw, vport_num,
                                                                 esw_owner_vhca_id);

        netdev_for_each_lower_dev(dev, lower_dev, iter) {
                struct net_device *rep;

                if (netif_is_bridge_master(lower_dev))
                        continue;

                rep = mlx5_esw_bridge_lower_rep_vport_num_vhca_id_get(lower_dev, esw, vport_num,
                                                                      esw_owner_vhca_id);
                if (rep)
                        return rep;
        }

        return NULL;
}

static bool mlx5_esw_bridge_is_local(struct net_device *dev, struct net_device *rep,
                                     struct mlx5_eswitch *esw)
{
        struct mlx5_core_dev *mdev;
        struct mlx5e_priv *priv;

        if (!mlx5_esw_bridge_dev_same_esw(rep, esw))
                return false;

        priv = netdev_priv(rep);
        mdev = priv->mdev;
        if (netif_is_lag_master(dev))
                return mlx5_lag_is_master(mdev);
        return true;
}

static int mlx5_esw_bridge_port_changeupper(struct notifier_block *nb, void *ptr)
{
        struct mlx5_esw_bridge_offloads *br_offloads = container_of(nb,
                                                                    struct mlx5_esw_bridge_offloads,
                                                                    netdev_nb);
        struct net_device *dev = netdev_notifier_info_to_dev(ptr);
        struct netdev_notifier_changeupper_info *info = ptr;
        struct net_device *upper = info->upper_dev, *rep;
        struct mlx5_eswitch *esw = br_offloads->esw;
        u16 vport_num, esw_owner_vhca_id;
        struct netlink_ext_ack *extack;
        int err = 0;

        if (!netif_is_bridge_master(upper))
                return 0;

        rep = mlx5_esw_bridge_rep_vport_num_vhca_id_get(dev, esw, &vport_num, &esw_owner_vhca_id);
        if (!rep)
                return 0;

        extack = netdev_notifier_info_to_extack(&info->info);

        if (mlx5_esw_bridge_is_local(dev, rep, esw))
                err = info->linking ?
                        mlx5_esw_bridge_vport_link(upper, vport_num, esw_owner_vhca_id,
                                                   br_offloads, extack) :
                        mlx5_esw_bridge_vport_unlink(upper, vport_num, esw_owner_vhca_id,
                                                     br_offloads, extack);
        else if (mlx5_esw_bridge_dev_same_hw(rep, esw))
                err = info->linking ?
                        mlx5_esw_bridge_vport_peer_link(upper, vport_num, esw_owner_vhca_id,
                                                        br_offloads, extack) :
                        mlx5_esw_bridge_vport_peer_unlink(upper, vport_num, esw_owner_vhca_id,
                                                          br_offloads, extack);

        return err;
}

static int
mlx5_esw_bridge_changeupper_validate_netdev(void *ptr)
{
        struct net_device *dev = netdev_notifier_info_to_dev(ptr);
        struct netdev_notifier_changeupper_info *info = ptr;
        struct net_device *upper = info->upper_dev;
        struct net_device *lower;
        struct list_head *iter;

        if (!netif_is_bridge_master(upper) || !netif_is_lag_master(dev))
                return 0;

        netdev_for_each_lower_dev(dev, lower, iter) {
                struct mlx5_core_dev *mdev;
                struct mlx5e_priv *priv;

                if (!mlx5e_eswitch_rep(lower))
                        continue;

                priv = netdev_priv(lower);
                mdev = priv->mdev;
                if (!mlx5_lag_is_active(mdev))
                        return -EAGAIN;
                if (!mlx5_lag_is_shared_fdb(mdev))
                        return -EOPNOTSUPP;
        }

        return 0;
}

static int mlx5_esw_bridge_switchdev_port_event(struct notifier_block *nb,
                                                unsigned long event, void *ptr)
{
        int err = 0;

        switch (event) {
        case NETDEV_PRECHANGEUPPER:
                err = mlx5_esw_bridge_changeupper_validate_netdev(ptr);
                break;

        case NETDEV_CHANGEUPPER:
                err = mlx5_esw_bridge_port_changeupper(nb, ptr);
                break;
        }

        return notifier_from_errno(err);
}

static int
mlx5_esw_bridge_port_obj_add(struct net_device *dev,
                             struct switchdev_notifier_port_obj_info *port_obj_info,
                             struct mlx5_esw_bridge_offloads *br_offloads)
{
        struct netlink_ext_ack *extack = switchdev_notifier_info_to_extack(&port_obj_info->info);
        const struct switchdev_obj *obj = port_obj_info->obj;
        const struct switchdev_obj_port_vlan *vlan;
        const struct switchdev_obj_port_mdb *mdb;
        u16 vport_num, esw_owner_vhca_id;
        int err;

        if (!mlx5_esw_bridge_rep_vport_num_vhca_id_get(dev, br_offloads->esw, &vport_num,
                                                       &esw_owner_vhca_id))
                return 0;

        port_obj_info->handled = true;

        switch (obj->id) {
        case SWITCHDEV_OBJ_ID_PORT_VLAN:
                vlan = SWITCHDEV_OBJ_PORT_VLAN(obj);
                err = mlx5_esw_bridge_port_vlan_add(vport_num, esw_owner_vhca_id, vlan->vid,
                                                    vlan->flags, br_offloads, extack);
                break;
        case SWITCHDEV_OBJ_ID_PORT_MDB:
                mdb = SWITCHDEV_OBJ_PORT_MDB(obj);
                err = mlx5_esw_bridge_port_mdb_add(dev, vport_num, esw_owner_vhca_id, mdb->addr,
                                                   mdb->vid, br_offloads, extack);
                break;
        default:
                return -EOPNOTSUPP;
        }
        return err;
}

static int
mlx5_esw_bridge_port_obj_del(struct net_device *dev,
                             struct switchdev_notifier_port_obj_info *port_obj_info,
                             struct mlx5_esw_bridge_offloads *br_offloads)
{
        const struct switchdev_obj *obj = port_obj_info->obj;
        const struct switchdev_obj_port_vlan *vlan;
        const struct switchdev_obj_port_mdb *mdb;
        u16 vport_num, esw_owner_vhca_id;

        if (!mlx5_esw_bridge_rep_vport_num_vhca_id_get(dev, br_offloads->esw, &vport_num,
                                                       &esw_owner_vhca_id))
                return 0;

        port_obj_info->handled = true;

        switch (obj->id) {
        case SWITCHDEV_OBJ_ID_PORT_VLAN:
                vlan = SWITCHDEV_OBJ_PORT_VLAN(obj);
                mlx5_esw_bridge_port_vlan_del(vport_num, esw_owner_vhca_id, vlan->vid, br_offloads);
                break;
        case SWITCHDEV_OBJ_ID_PORT_MDB:
                mdb = SWITCHDEV_OBJ_PORT_MDB(obj);
                mlx5_esw_bridge_port_mdb_del(dev, vport_num, esw_owner_vhca_id, mdb->addr, mdb->vid,
                                             br_offloads);
                break;
        default:
                return -EOPNOTSUPP;
        }
        return 0;
}

static int
mlx5_esw_bridge_port_obj_attr_set(struct net_device *dev,
                                  struct switchdev_notifier_port_attr_info *port_attr_info,
                                  struct mlx5_esw_bridge_offloads *br_offloads)
{
        struct netlink_ext_ack *extack = switchdev_notifier_info_to_extack(&port_attr_info->info);
        const struct switchdev_attr *attr = port_attr_info->attr;
        u16 vport_num, esw_owner_vhca_id;
        int err = 0;

        if (!mlx5_esw_bridge_lower_rep_vport_num_vhca_id_get(dev, br_offloads->esw, &vport_num,
                                                             &esw_owner_vhca_id))
                return 0;

        port_attr_info->handled = true;

        switch (attr->id) {
        case SWITCHDEV_ATTR_ID_PORT_PRE_BRIDGE_FLAGS:
                if (attr->u.brport_flags.mask & ~(BR_LEARNING | BR_FLOOD | BR_MCAST_FLOOD)) {
                        NL_SET_ERR_MSG_MOD(extack, "Flag is not supported");
                        err = -EINVAL;
                }
                break;
        case SWITCHDEV_ATTR_ID_PORT_BRIDGE_FLAGS:
                break;
        case SWITCHDEV_ATTR_ID_BRIDGE_AGEING_TIME:
                err = mlx5_esw_bridge_ageing_time_set(vport_num, esw_owner_vhca_id,
                                                      attr->u.ageing_time, br_offloads);
                break;
        case SWITCHDEV_ATTR_ID_BRIDGE_VLAN_FILTERING:
                err = mlx5_esw_bridge_vlan_filtering_set(vport_num, esw_owner_vhca_id,
                                                         attr->u.vlan_filtering, br_offloads);
                break;
        case SWITCHDEV_ATTR_ID_BRIDGE_VLAN_PROTOCOL:
                err = mlx5_esw_bridge_vlan_proto_set(vport_num,
                                                     esw_owner_vhca_id,
                                                     attr->u.vlan_protocol,
                                                     br_offloads);
                break;
        case SWITCHDEV_ATTR_ID_BRIDGE_MC_DISABLED:
                err = mlx5_esw_bridge_mcast_set(vport_num, esw_owner_vhca_id,
                                                !attr->u.mc_disabled, br_offloads);
                break;
        default:
                err = -EOPNOTSUPP;
        }

        return err;
}

static int mlx5_esw_bridge_event_blocking(struct notifier_block *nb,
                                          unsigned long event, void *ptr)
{
        struct mlx5_esw_bridge_offloads *br_offloads = container_of(nb,
                                                                    struct mlx5_esw_bridge_offloads,
                                                                    nb_blk);
        struct net_device *dev = switchdev_notifier_info_to_dev(ptr);
        int err;

        switch (event) {
        case SWITCHDEV_PORT_OBJ_ADD:
                err = mlx5_esw_bridge_port_obj_add(dev, ptr, br_offloads);
                break;
        case SWITCHDEV_PORT_OBJ_DEL:
                err = mlx5_esw_bridge_port_obj_del(dev, ptr, br_offloads);
                break;
        case SWITCHDEV_PORT_ATTR_SET:
                err = mlx5_esw_bridge_port_obj_attr_set(dev, ptr, br_offloads);
                break;
        default:
                err = 0;
        }

        return notifier_from_errno(err);
}

static void
mlx5_esw_bridge_cleanup_switchdev_fdb_work(struct mlx5_bridge_switchdev_fdb_work *fdb_work)
{
        dev_put(fdb_work->dev);
        kfree(fdb_work->fdb_info.addr);
        kfree(fdb_work);
}

static void mlx5_esw_bridge_switchdev_fdb_event_work(struct work_struct *work)
{
        struct mlx5_bridge_switchdev_fdb_work *fdb_work =
                container_of(work, struct mlx5_bridge_switchdev_fdb_work, work);
        struct switchdev_notifier_fdb_info *fdb_info =
                &fdb_work->fdb_info;
        struct mlx5_esw_bridge_offloads *br_offloads =
                fdb_work->br_offloads;
        struct net_device *dev = fdb_work->dev;
        u16 vport_num, esw_owner_vhca_id;

        rtnl_lock();

        if (!mlx5_esw_bridge_rep_vport_num_vhca_id_get(dev, br_offloads->esw, &vport_num,
                                                       &esw_owner_vhca_id))
                goto out;

        if (fdb_work->add)
                mlx5_esw_bridge_fdb_create(dev, vport_num, esw_owner_vhca_id, br_offloads,
                                           fdb_info);
        else
                mlx5_esw_bridge_fdb_remove(dev, vport_num, esw_owner_vhca_id, br_offloads,
                                           fdb_info);

out:
        rtnl_unlock();
        mlx5_esw_bridge_cleanup_switchdev_fdb_work(fdb_work);
}

static struct mlx5_bridge_switchdev_fdb_work *
mlx5_esw_bridge_init_switchdev_fdb_work(struct net_device *dev, bool add,
                                        struct switchdev_notifier_fdb_info *fdb_info,
                                        struct mlx5_esw_bridge_offloads *br_offloads)
{
        struct mlx5_bridge_switchdev_fdb_work *work;
        u8 *addr;

        work = kzalloc_obj(*work, GFP_ATOMIC);
        if (!work)
                return ERR_PTR(-ENOMEM);

        INIT_WORK(&work->work, mlx5_esw_bridge_switchdev_fdb_event_work);
        memcpy(&work->fdb_info, fdb_info, sizeof(work->fdb_info));

        addr = kzalloc(ETH_ALEN, GFP_ATOMIC);
        if (!addr) {
                kfree(work);
                return ERR_PTR(-ENOMEM);
        }
        ether_addr_copy(addr, fdb_info->addr);
        work->fdb_info.addr = addr;

        dev_hold(dev);
        work->dev = dev;
        work->br_offloads = br_offloads;
        work->add = add;
        return work;
}

static int mlx5_esw_bridge_switchdev_event(struct notifier_block *nb,
                                           unsigned long event, void *ptr)
{
        struct mlx5_esw_bridge_offloads *br_offloads = container_of(nb,
                                                                    struct mlx5_esw_bridge_offloads,
                                                                    nb);
        struct net_device *dev = switchdev_notifier_info_to_dev(ptr);
        struct switchdev_notifier_fdb_info *fdb_info;
        struct mlx5_bridge_switchdev_fdb_work *work;
        struct mlx5_eswitch *esw = br_offloads->esw;
        struct switchdev_notifier_info *info = ptr;
        u16 vport_num, esw_owner_vhca_id;
        struct net_device *upper, *rep;

        if (event == SWITCHDEV_PORT_ATTR_SET) {
                int err = mlx5_esw_bridge_port_obj_attr_set(dev, ptr, br_offloads);

                return notifier_from_errno(err);
        }

        upper = netdev_master_upper_dev_get_rcu(dev);
        if (!upper)
                return NOTIFY_DONE;
        if (!netif_is_bridge_master(upper))
                return NOTIFY_DONE;

        rep = mlx5_esw_bridge_rep_vport_num_vhca_id_get(dev, esw, &vport_num, &esw_owner_vhca_id);
        if (!rep)
                return NOTIFY_DONE;

        if (netif_is_lag_master(dev) && !mlx5_lag_is_shared_fdb(esw->dev))
                return NOTIFY_DONE;

        switch (event) {
        case SWITCHDEV_FDB_ADD_TO_BRIDGE:
                fdb_info = container_of(info,
                                        struct switchdev_notifier_fdb_info,
                                        info);
                mlx5_esw_bridge_fdb_update_used(dev, vport_num, esw_owner_vhca_id, br_offloads,
                                                fdb_info);
                break;
        case SWITCHDEV_FDB_DEL_TO_BRIDGE:
                /* only handle the event on peers */
                if (mlx5_esw_bridge_is_local(dev, rep, esw))
                        break;

                fdb_info = container_of(info,
                                        struct switchdev_notifier_fdb_info,
                                        info);
                /* Mark for deletion to prevent the update wq task from
                 * spuriously refreshing the entry which would mark it again as
                 * offloaded in SW bridge. After this fallthrough to regular
                 * async delete code.
                 */
                mlx5_esw_bridge_fdb_mark_deleted(dev, vport_num, esw_owner_vhca_id, br_offloads,
                                                 fdb_info);
                fallthrough;
        case SWITCHDEV_FDB_ADD_TO_DEVICE:
        case SWITCHDEV_FDB_DEL_TO_DEVICE:
                fdb_info = container_of(info,
                                        struct switchdev_notifier_fdb_info,
                                        info);

                work = mlx5_esw_bridge_init_switchdev_fdb_work(dev,
                                                               event == SWITCHDEV_FDB_ADD_TO_DEVICE,
                                                               fdb_info,
                                                               br_offloads);
                if (IS_ERR(work)) {
                        WARN_ONCE(1, "Failed to init switchdev work, err=%pe",
                                  work);
                        return notifier_from_errno(PTR_ERR(work));
                }

                queue_work(br_offloads->wq, &work->work);
                break;
        default:
                break;
        }
        return NOTIFY_DONE;
}

static void mlx5_esw_bridge_update_work(struct work_struct *work)
{
        struct mlx5_esw_bridge_offloads *br_offloads = container_of(work,
                                                                    struct mlx5_esw_bridge_offloads,
                                                                    update_work.work);

        rtnl_lock();
        mlx5_esw_bridge_update(br_offloads);
        rtnl_unlock();

        queue_delayed_work(br_offloads->wq, &br_offloads->update_work,
                           msecs_to_jiffies(MLX5_ESW_BRIDGE_UPDATE_INTERVAL));
}

void mlx5e_rep_bridge_init(struct mlx5e_priv *priv)
{
        struct mlx5_esw_bridge_offloads *br_offloads;
        struct mlx5_core_dev *mdev = priv->mdev;
        struct mlx5_eswitch *esw =
                mdev->priv.eswitch;
        int err;

        rtnl_lock();
        br_offloads = mlx5_esw_bridge_init(esw);
        rtnl_unlock();
        if (IS_ERR(br_offloads)) {
                esw_warn(mdev, "Failed to init esw bridge (err=%pe)\n",
                         br_offloads);
                return;
        }

        br_offloads->wq = alloc_ordered_workqueue("mlx5_bridge_wq", 0);
        if (!br_offloads->wq) {
                esw_warn(mdev, "Failed to allocate bridge offloads workqueue\n");
                goto err_alloc_wq;
        }

        br_offloads->nb.notifier_call = mlx5_esw_bridge_switchdev_event;
        err = register_switchdev_notifier(&br_offloads->nb);
        if (err) {
                esw_warn(mdev, "Failed to register switchdev notifier (err=%d)\n", err);
                goto err_register_swdev;
        }

        br_offloads->nb_blk.notifier_call = mlx5_esw_bridge_event_blocking;
        err = register_switchdev_blocking_notifier(&br_offloads->nb_blk);
        if (err) {
                esw_warn(mdev, "Failed to register blocking switchdev notifier (err=%d)\n", err);
                goto err_register_swdev_blk;
        }

        br_offloads->netdev_nb.notifier_call = mlx5_esw_bridge_switchdev_port_event;
        err = register_netdevice_notifier_net(&init_net, &br_offloads->netdev_nb);
        if (err) {
                esw_warn(mdev, "Failed to register bridge offloads netdevice notifier (err=%d)\n",
                         err);
                goto err_register_netdev;
        }
        INIT_DELAYED_WORK(&br_offloads->update_work, mlx5_esw_bridge_update_work);
        queue_delayed_work(br_offloads->wq, &br_offloads->update_work,
                           msecs_to_jiffies(MLX5_ESW_BRIDGE_UPDATE_INTERVAL));
        return;

err_register_netdev:
        unregister_switchdev_blocking_notifier(&br_offloads->nb_blk);
err_register_swdev_blk:
        unregister_switchdev_notifier(&br_offloads->nb);
err_register_swdev:
        destroy_workqueue(br_offloads->wq);
err_alloc_wq:
        rtnl_lock();
        mlx5_esw_bridge_cleanup(esw);
        rtnl_unlock();
}

void mlx5e_rep_bridge_cleanup(struct mlx5e_priv *priv)
{
        struct mlx5_esw_bridge_offloads *br_offloads;
        struct mlx5_core_dev *mdev = priv->mdev;
        struct mlx5_eswitch *esw =
                mdev->priv.eswitch;

        br_offloads = esw->br_offloads;
        if (!br_offloads)
                return;

        cancel_delayed_work_sync(&br_offloads->update_work);
        unregister_netdevice_notifier_net(&init_net, &br_offloads->netdev_nb);
        unregister_switchdev_blocking_notifier(&br_offloads->nb_blk);
        unregister_switchdev_notifier(&br_offloads->nb);
        destroy_workqueue(br_offloads->wq);
        rtnl_lock();
        mlx5_esw_bridge_cleanup(esw);
        rtnl_unlock();
}