root/sys/dev/mlx5/mlx5_en/mlx5_en_flow_table.c
/*-
 * Copyright (c) 2015-2021 Mellanox Technologies. All rights reserved.
 *
 * Redistribution and use in source and binary forms, with or without
 * modification, are permitted provided that the following conditions
 * are met:
 * 1. Redistributions of source code must retain the above copyright
 *    notice, this list of conditions and the following disclaimer.
 * 2. Redistributions in binary form must reproduce the above copyright
 *    notice, this list of conditions and the following disclaimer in the
 *    documentation and/or other materials provided with the distribution.
 *
 * THIS SOFTWARE IS PROVIDED BY AUTHOR AND CONTRIBUTORS `AS IS' AND
 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
 * ARE DISCLAIMED.  IN NO EVENT SHALL AUTHOR OR CONTRIBUTORS BE LIABLE
 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
 * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
 * SUCH DAMAGE.
 */

#include "opt_rss.h"
#include "opt_ratelimit.h"

#include <dev/mlx5/mlx5_en/en.h>
#include <dev/mlx5/mlx5_accel/ipsec.h>

#include <linux/list.h>
#include <dev/mlx5/fs.h>
#include <dev/mlx5/mpfs.h>
#include <dev/mlx5/mlx5_core/fs_tcp.h>

/*
 * The flow tables with rules define the packet processing on receive.
 * Currently the following structure is set up to handle different
 * offloads like TLS RX offload, VLAN decapsulation, packet
 * classification, RSS hashing, VxLAN checksum offloading:
 *
 *   +=========+       +=========+      +=================+
 *   |TCP/IPv4 |       |TCP/IPv4 |      |TCP/IPv4 Match   |
 *   |Flowtable|------>|         |----->|Outer Proto Match|=====> TLS TIR n
 *   |         |       |Catch-all|\     |                 |
 *   +=========+       +=========+|     +=================+
 *                                |
 *       +------------------------+
 *       V
 *   +=========+       +=========+      +=================+
 *   |TCP/IPv6 |       |TCP/IPv6 |      |TCP/IPv6 Match   |
 *   |Flowtable|------>|         |----->|Outer Proto Match|=====> TLS TIR n
 *   |         |       |Catch-all|\     |                 |
 *   +=========+       +=========+|     +=================+
 *                                |
 *       +------------------------+
 *       V
 *   +=========+       +=========+      +=================+
 *   |VLAN ft: |       |VxLAN    |      |VxLAN Main       |
 *   |CTAG/STAG|------>|      VNI|----->|Inner Proto Match|=====> Inner TIR n
 *   |VID/noVID|/      |Catch-all|\     |                 |
 *   +=========+       +=========+|     +=================+
 *                                |
 *                                |
 *                                |
 *                                v
 *                      +=================+
 *                      |Main             |
 *                      |Outer Proto Match|=====> TIR n
 *                      |                 |
 *                      +=================+
 *
 * The path through flow rules directs each packet into an appropriate TIR,
 * according to the:
 * - VLAN encapsulation
 * - Outer protocol
 * - Presence of inner protocol
 */

#define MLX5_SET_CFG(p, f, v) MLX5_SET(create_flow_group_in, p, f, v)

enum {
        MLX5E_FULLMATCH = 0,
        MLX5E_ALLMULTI = 1,
        MLX5E_PROMISC = 2,
};

enum {
        MLX5E_UC = 0,
        MLX5E_MC_IPV4 = 1,
        MLX5E_MC_IPV6 = 2,
        MLX5E_MC_OTHER = 3,
};

enum {
        MLX5E_ACTION_NONE = 0,
        MLX5E_ACTION_ADD = 1,
        MLX5E_ACTION_DEL = 2,
};

struct mlx5e_eth_addr_hash_node {
        LIST_ENTRY(mlx5e_eth_addr_hash_node) hlist;
        u8      action;
        u32     mpfs_index;
        struct mlx5e_eth_addr_info ai;
};

static void mlx5e_del_all_vlan_rules(struct mlx5e_priv *);

static inline int
mlx5e_hash_eth_addr(const u8 * addr)
{
        return (addr[5]);
}

static bool
mlx5e_add_eth_addr_to_hash(struct mlx5e_eth_addr_hash_head *hash,
    struct mlx5e_eth_addr_hash_node *hn_new)
{
        struct mlx5e_eth_addr_hash_node *hn;
        u32 ix = mlx5e_hash_eth_addr(hn_new->ai.addr);

        LIST_FOREACH(hn, &hash[ix], hlist) {
                if (bcmp(hn->ai.addr, hn_new->ai.addr, ETHER_ADDR_LEN) == 0) {
                        if (hn->action == MLX5E_ACTION_DEL)
                                hn->action = MLX5E_ACTION_NONE;
                        free(hn_new, M_MLX5EN);
                        return (false);
                }
        }
        LIST_INSERT_HEAD(&hash[ix], hn_new, hlist);
        return (true);
}

static void
mlx5e_del_eth_addr_from_hash(struct mlx5e_eth_addr_hash_node *hn)
{
        LIST_REMOVE(hn, hlist);
        free(hn, M_MLX5EN);
}

static void
mlx5e_del_eth_addr_from_flow_table(struct mlx5e_priv *priv,
    struct mlx5e_eth_addr_info *ai)
{
        mlx5_del_flow_rules(&ai->ft_rule[MLX5E_TT_IPV6_IPSEC_ESP]);
        mlx5_del_flow_rules(&ai->ft_rule[MLX5E_TT_IPV4_IPSEC_ESP]);
        mlx5_del_flow_rules(&ai->ft_rule[MLX5E_TT_IPV6_IPSEC_AH]);
        mlx5_del_flow_rules(&ai->ft_rule[MLX5E_TT_IPV4_IPSEC_AH]);
        mlx5_del_flow_rules(&ai->ft_rule[MLX5E_TT_IPV6_TCP]);
        mlx5_del_flow_rules(&ai->ft_rule[MLX5E_TT_IPV4_TCP]);
        mlx5_del_flow_rules(&ai->ft_rule[MLX5E_TT_IPV6_UDP]);
        mlx5_del_flow_rules(&ai->ft_rule[MLX5E_TT_IPV4_UDP]);
        mlx5_del_flow_rules(&ai->ft_rule[MLX5E_TT_IPV6]);
        mlx5_del_flow_rules(&ai->ft_rule[MLX5E_TT_IPV4]);
        mlx5_del_flow_rules(&ai->ft_rule[MLX5E_TT_ANY]);
}

static int
mlx5e_get_eth_addr_type(const u8 * addr)
{
        if (ETHER_IS_MULTICAST(addr) == 0)
                return (MLX5E_UC);

        if ((addr[0] == 0x01) &&
            (addr[1] == 0x00) &&
            (addr[2] == 0x5e) &&
            !(addr[3] & 0x80))
                return (MLX5E_MC_IPV4);

        if ((addr[0] == 0x33) &&
            (addr[1] == 0x33))
                return (MLX5E_MC_IPV6);

        return (MLX5E_MC_OTHER);
}

static  u32
mlx5e_get_tt_vec(struct mlx5e_eth_addr_info *ai, int type)
{
        int eth_addr_type;
        u32 ret;

        switch (type) {
        case MLX5E_FULLMATCH:
                eth_addr_type = mlx5e_get_eth_addr_type(ai->addr);
                switch (eth_addr_type) {
                case MLX5E_UC:
                        ret =
                            (1 << MLX5E_TT_IPV4_TCP) |
                            (1 << MLX5E_TT_IPV6_TCP) |
                            (1 << MLX5E_TT_IPV4_UDP) |
                            (1 << MLX5E_TT_IPV6_UDP) |
                            (1 << MLX5E_TT_IPV4) |
                            (1 << MLX5E_TT_IPV6) |
                            (1 << MLX5E_TT_ANY) |
                            0;
                        break;

                case MLX5E_MC_IPV4:
                        ret =
                            (1 << MLX5E_TT_IPV4_UDP) |
                            (1 << MLX5E_TT_IPV4) |
                            0;
                        break;

                case MLX5E_MC_IPV6:
                        ret =
                            (1 << MLX5E_TT_IPV6_UDP) |
                            (1 << MLX5E_TT_IPV6) |
                            0;
                        break;

                default:
                        ret =
                            (1 << MLX5E_TT_ANY) |
                            0;
                        break;
                }
                break;

        case MLX5E_ALLMULTI:
                ret =
                    (1 << MLX5E_TT_IPV4_UDP) |
                    (1 << MLX5E_TT_IPV6_UDP) |
                    (1 << MLX5E_TT_IPV4) |
                    (1 << MLX5E_TT_IPV6) |
                    (1 << MLX5E_TT_ANY) |
                    0;
                break;

        default:                        /* MLX5E_PROMISC */
                ret =
                    (1 << MLX5E_TT_IPV4_TCP) |
                    (1 << MLX5E_TT_IPV6_TCP) |
                    (1 << MLX5E_TT_IPV4_UDP) |
                    (1 << MLX5E_TT_IPV6_UDP) |
                    (1 << MLX5E_TT_IPV4) |
                    (1 << MLX5E_TT_IPV6) |
                    (1 << MLX5E_TT_ANY) |
                    0;
                break;
        }

        return (ret);
}

static int
mlx5e_add_eth_addr_rule_sub(struct mlx5e_priv *priv,
    struct mlx5e_eth_addr_info *ai, int type,
    struct mlx5_flow_spec *spec)
{
        struct mlx5_flow_destination dest = {};
        u8 mc_enable = 0;
        struct mlx5_flow_handle **rule_p;
        struct mlx5_flow_table *ft = priv->fts.main.t;
        u8 *mc_dmac = MLX5_ADDR_OF(fte_match_param, spec->match_criteria,
                                   outer_headers.dmac_47_16);
        u8 *mv_dmac = MLX5_ADDR_OF(fte_match_param, spec->match_value,
                                   outer_headers.dmac_47_16);
        u32 *tirn = priv->tirn;
        u32 tt_vec;
        int err = 0;
        struct mlx5_flow_act flow_act = {
                .action = MLX5_FLOW_CONTEXT_ACTION_FWD_DEST,
        };
        u8 *mc;
        u8 *mv;

        mv = (u8 *)spec->match_value;
        mc = (u8 *)spec->match_criteria;

        spec->flow_context.flow_tag = MLX5_FS_ETH_FLOW_TAG;
        spec->flow_context.flags = FLOW_CONTEXT_HAS_TAG;
        dest.type = MLX5_FLOW_DESTINATION_TYPE_TIR;

        switch (type) {
        case MLX5E_FULLMATCH:
                mc_enable = MLX5_MATCH_OUTER_HEADERS;
                memset(mc_dmac, 0xff, ETH_ALEN);
                ether_addr_copy(mv_dmac, ai->addr);
                break;

        case MLX5E_ALLMULTI:
                mc_enable = MLX5_MATCH_OUTER_HEADERS;
                mc_dmac[0] = 0x01;
                mv_dmac[0] = 0x01;
                break;

        case MLX5E_PROMISC:
                break;
        default:
                break;
        }

        tt_vec = mlx5e_get_tt_vec(ai, type);

        spec->match_criteria_enable = mc_enable;
        if (tt_vec & BIT(MLX5E_TT_ANY)) {
                rule_p = &ai->ft_rule[MLX5E_TT_ANY];
                dest.tir_num = tirn[MLX5E_TT_ANY];
                *rule_p = mlx5_add_flow_rules(ft, spec, &flow_act, &dest, 1);
                if (IS_ERR_OR_NULL(*rule_p))
                        goto err_del_ai;
        }

        mc_enable = MLX5_MATCH_OUTER_HEADERS;
        MLX5_SET_TO_ONES(fte_match_param, mc, outer_headers.ethertype);

        spec->match_criteria_enable = mc_enable;
        if (tt_vec & BIT(MLX5E_TT_IPV4)) {
                rule_p = &ai->ft_rule[MLX5E_TT_IPV4];
                dest.tir_num = tirn[MLX5E_TT_IPV4];
                MLX5_SET(fte_match_param, mv, outer_headers.ethertype,
                         ETHERTYPE_IP);
                *rule_p = mlx5_add_flow_rules(ft, spec, &flow_act, &dest, 1);
                if (IS_ERR_OR_NULL(*rule_p))
                        goto err_del_ai;
        }

        if (tt_vec & BIT(MLX5E_TT_IPV6)) {
                rule_p = &ai->ft_rule[MLX5E_TT_IPV6];
                dest.tir_num = tirn[MLX5E_TT_IPV6];
                MLX5_SET(fte_match_param, mv, outer_headers.ethertype,
                         ETHERTYPE_IPV6);
                *rule_p = mlx5_add_flow_rules(ft, spec, &flow_act, &dest, 1);
                if (IS_ERR_OR_NULL(*rule_p))
                        goto err_del_ai;
        }

        MLX5_SET_TO_ONES(fte_match_param, mc, outer_headers.ip_protocol);
        MLX5_SET(fte_match_param, mv, outer_headers.ip_protocol, IPPROTO_UDP);

        if (tt_vec & BIT(MLX5E_TT_IPV4_UDP)) {
                rule_p = &ai->ft_rule[MLX5E_TT_IPV4_UDP];
                dest.tir_num = tirn[MLX5E_TT_IPV4_UDP];
                MLX5_SET(fte_match_param, mv, outer_headers.ethertype,
                         ETHERTYPE_IP);
                *rule_p = mlx5_add_flow_rules(ft, spec, &flow_act, &dest, 1);
                if (IS_ERR_OR_NULL(*rule_p))
                        goto err_del_ai;
        }

        if (tt_vec & BIT(MLX5E_TT_IPV6_UDP)) {
                rule_p = &ai->ft_rule[MLX5E_TT_IPV6_UDP];
                dest.tir_num = tirn[MLX5E_TT_IPV6_UDP];
                MLX5_SET(fte_match_param, mv, outer_headers.ethertype,
                         ETHERTYPE_IPV6);
                *rule_p = mlx5_add_flow_rules(ft, spec, &flow_act, &dest, 1);
                if (IS_ERR_OR_NULL(*rule_p))
                        goto err_del_ai;
        }

        MLX5_SET(fte_match_param, mv, outer_headers.ip_protocol, IPPROTO_TCP);

        if (tt_vec & BIT(MLX5E_TT_IPV4_TCP)) {
                rule_p = &ai->ft_rule[MLX5E_TT_IPV4_TCP];
                dest.tir_num = tirn[MLX5E_TT_IPV4_TCP];
                MLX5_SET(fte_match_param, mv, outer_headers.ethertype,
                         ETHERTYPE_IP);
                *rule_p = mlx5_add_flow_rules(ft, spec, &flow_act, &dest, 1);
                if (IS_ERR_OR_NULL(*rule_p))
                        goto err_del_ai;
        }

        if (tt_vec & BIT(MLX5E_TT_IPV6_TCP)) {
                rule_p = &ai->ft_rule[MLX5E_TT_IPV6_TCP];
                dest.tir_num = tirn[MLX5E_TT_IPV6_TCP];
                MLX5_SET(fte_match_param, mv, outer_headers.ethertype,
                         ETHERTYPE_IPV6);
                *rule_p = mlx5_add_flow_rules(ft, spec, &flow_act, &dest, 1);
                if (IS_ERR_OR_NULL(*rule_p))
                        goto err_del_ai;
        }

        MLX5_SET(fte_match_param, mv, outer_headers.ip_protocol, IPPROTO_AH);

        if (tt_vec & BIT(MLX5E_TT_IPV4_IPSEC_AH)) {
                rule_p = &ai->ft_rule[MLX5E_TT_IPV4_IPSEC_AH];
                dest.tir_num = tirn[MLX5E_TT_IPV4_IPSEC_AH];
                MLX5_SET(fte_match_param, mv, outer_headers.ethertype,
                         ETHERTYPE_IP);
                *rule_p = mlx5_add_flow_rules(ft, spec, &flow_act, &dest, 1);
                if (IS_ERR_OR_NULL(*rule_p))
                        goto err_del_ai;
        }

        if (tt_vec & BIT(MLX5E_TT_IPV6_IPSEC_AH)) {
                rule_p = &ai->ft_rule[MLX5E_TT_IPV6_IPSEC_AH];
                dest.tir_num = tirn[MLX5E_TT_IPV6_IPSEC_AH];
                MLX5_SET(fte_match_param, mv, outer_headers.ethertype,
                         ETHERTYPE_IPV6);
                *rule_p = mlx5_add_flow_rules(ft, spec, &flow_act, &dest, 1);
                if (IS_ERR_OR_NULL(*rule_p))
                        goto err_del_ai;
        }

        MLX5_SET(fte_match_param, mv, outer_headers.ip_protocol, IPPROTO_ESP);

        if (tt_vec & BIT(MLX5E_TT_IPV4_IPSEC_ESP)) {
                rule_p = &ai->ft_rule[MLX5E_TT_IPV4_IPSEC_ESP];
                dest.tir_num = tirn[MLX5E_TT_IPV4_IPSEC_ESP];
                MLX5_SET(fte_match_param, mv, outer_headers.ethertype,
                         ETHERTYPE_IP);
                *rule_p = mlx5_add_flow_rules(ft, spec, &flow_act, &dest, 1);
                if (IS_ERR_OR_NULL(*rule_p))
                        goto err_del_ai;
        }

        if (tt_vec & BIT(MLX5E_TT_IPV6_IPSEC_ESP)) {
                rule_p = &ai->ft_rule[MLX5E_TT_IPV6_IPSEC_ESP];
                dest.tir_num = tirn[MLX5E_TT_IPV6_IPSEC_ESP];
                MLX5_SET(fte_match_param, mv, outer_headers.ethertype,
                         ETHERTYPE_IPV6);
                *rule_p = mlx5_add_flow_rules(ft, spec, &flow_act, &dest, 1);
                if (IS_ERR_OR_NULL(*rule_p))
                        goto err_del_ai;
        }

        return 0;

err_del_ai:
        err = PTR_ERR(*rule_p);
        *rule_p = NULL;
        mlx5e_del_eth_addr_from_flow_table(priv, ai);

        return err;
}

static int
mlx5e_add_eth_addr_rule(struct mlx5e_priv *priv,
    struct mlx5e_eth_addr_info *ai, int type)
{
        struct mlx5_flow_spec *spec;
        int err = 0;

        spec = mlx5_vzalloc(sizeof(*spec));
        if (!spec) {
                mlx5_en_err(priv->ifp, "alloc failed\n");
                err = -ENOMEM;
                goto add_eth_addr_rule_out;
        }
        err = mlx5e_add_eth_addr_rule_sub(priv, ai, type, spec);

add_eth_addr_rule_out:
        kvfree(spec);

        return (err);
}

static void
mlx5e_del_main_vxlan_rules(struct mlx5e_priv *priv)
{
        mlx5_del_flow_rules(&priv->fts.main_vxlan_rule[MLX5E_TT_IPV6_IPSEC_ESP]);
        mlx5_del_flow_rules(&priv->fts.main_vxlan_rule[MLX5E_TT_IPV4_IPSEC_ESP]);
        mlx5_del_flow_rules(&priv->fts.main_vxlan_rule[MLX5E_TT_IPV6_IPSEC_AH]);
        mlx5_del_flow_rules(&priv->fts.main_vxlan_rule[MLX5E_TT_IPV4_IPSEC_AH]);
        mlx5_del_flow_rules(&priv->fts.main_vxlan_rule[MLX5E_TT_IPV6_TCP]);
        mlx5_del_flow_rules(&priv->fts.main_vxlan_rule[MLX5E_TT_IPV4_TCP]);
        mlx5_del_flow_rules(&priv->fts.main_vxlan_rule[MLX5E_TT_IPV6_UDP]);
        mlx5_del_flow_rules(&priv->fts.main_vxlan_rule[MLX5E_TT_IPV4_UDP]);
        mlx5_del_flow_rules(&priv->fts.main_vxlan_rule[MLX5E_TT_IPV6]);
        mlx5_del_flow_rules(&priv->fts.main_vxlan_rule[MLX5E_TT_IPV4]);
        mlx5_del_flow_rules(&priv->fts.main_vxlan_rule[MLX5E_TT_ANY]);
}

static int
mlx5e_add_main_vxlan_rules_sub(struct mlx5e_priv *priv,
                               struct mlx5_flow_spec *spec)
{
        struct mlx5_flow_destination dest = {};
        struct mlx5_flow_handle **rule_p;
        struct mlx5_flow_table *ft = priv->fts.main_vxlan.t;
        u32 *tirn = priv->tirn_inner_vxlan;
        struct mlx5_flow_act flow_act = {
                .action = MLX5_FLOW_CONTEXT_ACTION_FWD_DEST,
        };
        int err = 0;
        u8 *mc;
        u8 *mv;

        spec->flow_context.flags = FLOW_CONTEXT_HAS_TAG;
        spec->flow_context.flow_tag = MLX5_FS_ETH_FLOW_TAG;

        mc = (u8 *)spec->match_criteria;
        mv = (u8 *)spec->match_value;

        dest.type = MLX5_FLOW_DESTINATION_TYPE_TIR;

        spec->match_criteria_enable = MLX5_MATCH_INNER_HEADERS;
        MLX5_SET_TO_ONES(fte_match_param, mc, inner_headers.ethertype);

        rule_p = &priv->fts.main_vxlan_rule[MLX5E_TT_IPV4];
        dest.tir_num = tirn[MLX5E_TT_IPV4];
        MLX5_SET(fte_match_param, mv, inner_headers.ethertype, ETHERTYPE_IP);
        *rule_p = mlx5_add_flow_rules(ft, spec, &flow_act, &dest, 1);
        if (IS_ERR_OR_NULL(*rule_p))
                goto err_del_ai;

        rule_p = &priv->fts.main_vxlan_rule[MLX5E_TT_IPV6];
        dest.tir_num = tirn[MLX5E_TT_IPV6];
        MLX5_SET(fte_match_param, mv, inner_headers.ethertype, ETHERTYPE_IPV6);
        *rule_p = mlx5_add_flow_rules(ft, spec, &flow_act, &dest, 1);
        if (IS_ERR_OR_NULL(*rule_p))
                goto err_del_ai;

        MLX5_SET_TO_ONES(fte_match_param, mc, inner_headers.ip_protocol);
        MLX5_SET(fte_match_param, mv, inner_headers.ip_protocol, IPPROTO_UDP);

        rule_p = &priv->fts.main_vxlan_rule[MLX5E_TT_IPV4_UDP];
        dest.tir_num = tirn[MLX5E_TT_IPV4_UDP];
        MLX5_SET(fte_match_param, mv, inner_headers.ethertype, ETHERTYPE_IP);
        *rule_p = mlx5_add_flow_rules(ft, spec, &flow_act, &dest, 1);
        if (IS_ERR_OR_NULL(*rule_p))
                goto err_del_ai;

        rule_p = &priv->fts.main_vxlan_rule[MLX5E_TT_IPV6_UDP];
        dest.tir_num = tirn[MLX5E_TT_IPV6_UDP];
        MLX5_SET(fte_match_param, mv, inner_headers.ethertype, ETHERTYPE_IPV6);
        *rule_p = mlx5_add_flow_rules(ft, spec, &flow_act, &dest, 1);
        if (IS_ERR_OR_NULL(*rule_p))
                goto err_del_ai;

        MLX5_SET(fte_match_param, mv, inner_headers.ip_protocol, IPPROTO_TCP);

        rule_p = &priv->fts.main_vxlan_rule[MLX5E_TT_IPV4_TCP];
        dest.tir_num = tirn[MLX5E_TT_IPV4_TCP];
        MLX5_SET(fte_match_param, mv, inner_headers.ethertype, ETHERTYPE_IP);
        *rule_p = mlx5_add_flow_rules(ft, spec, &flow_act, &dest, 1);
        if (IS_ERR_OR_NULL(*rule_p))
                goto err_del_ai;

        rule_p = &priv->fts.main_vxlan_rule[MLX5E_TT_IPV6_TCP];
        dest.tir_num = tirn[MLX5E_TT_IPV6_TCP];
        MLX5_SET(fte_match_param, mv, inner_headers.ethertype, ETHERTYPE_IPV6);
        *rule_p = mlx5_add_flow_rules(ft, spec, &flow_act, &dest, 1);
        if (IS_ERR_OR_NULL(*rule_p))
                goto err_del_ai;

        MLX5_SET(fte_match_param, mv, inner_headers.ip_protocol, IPPROTO_AH);

        rule_p = &priv->fts.main_vxlan_rule[MLX5E_TT_IPV4_IPSEC_AH];
        dest.tir_num = tirn[MLX5E_TT_IPV4_IPSEC_AH];
        MLX5_SET(fte_match_param, mv, inner_headers.ethertype, ETHERTYPE_IP);
        *rule_p = mlx5_add_flow_rules(ft, spec, &flow_act, &dest, 1);
        if (IS_ERR_OR_NULL(*rule_p))
                goto err_del_ai;

        rule_p = &priv->fts.main_vxlan_rule[MLX5E_TT_IPV6_IPSEC_AH];
        dest.tir_num = tirn[MLX5E_TT_IPV6_IPSEC_AH];
        MLX5_SET(fte_match_param, mv, inner_headers.ethertype, ETHERTYPE_IPV6);
        *rule_p = mlx5_add_flow_rules(ft, spec, &flow_act, &dest, 1);
        if (IS_ERR_OR_NULL(*rule_p))
                goto err_del_ai;

        MLX5_SET(fte_match_param, mv, inner_headers.ip_protocol, IPPROTO_ESP);

        rule_p = &priv->fts.main_vxlan_rule[MLX5E_TT_IPV4_IPSEC_ESP];
        dest.tir_num = tirn[MLX5E_TT_IPV4_IPSEC_ESP];
        MLX5_SET(fte_match_param, mv, inner_headers.ethertype, ETHERTYPE_IP);
        *rule_p = mlx5_add_flow_rules(ft, spec, &flow_act, &dest, 1);
        if (IS_ERR_OR_NULL(*rule_p))
                        goto err_del_ai;

        rule_p = &priv->fts.main_vxlan_rule[MLX5E_TT_IPV6_IPSEC_ESP];
        dest.tir_num = tirn[MLX5E_TT_IPV6_IPSEC_ESP];
        MLX5_SET(fte_match_param, mv, inner_headers.ethertype,
                 ETHERTYPE_IPV6);
        *rule_p = mlx5_add_flow_rules(ft, spec, &flow_act, &dest, 1);
        if (IS_ERR_OR_NULL(*rule_p))
                goto err_del_ai;

        spec->match_criteria_enable = 0;
        memset(mv, 0, MLX5_ST_SZ_BYTES(fte_match_param));
        memset(mc, 0, MLX5_ST_SZ_BYTES(fte_match_param));
        rule_p = &priv->fts.main_vxlan_rule[MLX5E_TT_ANY];
        dest.tir_num = tirn[MLX5E_TT_ANY];
        *rule_p = mlx5_add_flow_rules(ft, NULL, &flow_act, &dest, 1);
        if (IS_ERR_OR_NULL(*rule_p))
                goto err_del_ai;

        return (0);

err_del_ai:
        err = PTR_ERR(*rule_p);
        *rule_p = NULL;
        mlx5e_del_main_vxlan_rules(priv);

        return (err);
}

static int
mlx5e_add_main_vxlan_rules(struct mlx5e_priv *priv)
{
        struct mlx5_flow_spec *spec;
        int err = 0;

        spec = mlx5_vzalloc(sizeof(*spec));
        if (!spec) {
                mlx5_en_err(priv->ifp, "alloc failed\n");
                err = -ENOMEM;
                goto add_main_vxlan_rules_out;
        }
        err = mlx5e_add_main_vxlan_rules_sub(priv, spec);

add_main_vxlan_rules_out:
        kvfree(spec);

        return (err);
}

static int mlx5e_vport_context_update_vlans(struct mlx5e_priv *priv)
{
        if_t ifp = priv->ifp;
        int max_list_size;
        int list_size;
        u16 *vlans;
        int vlan;
        int err;
        int i;

        list_size = 0;
        for_each_set_bit(vlan, priv->vlan.active_vlans, VLAN_N_VID)
                list_size++;

        max_list_size = 1 << MLX5_CAP_GEN(priv->mdev, log_max_vlan_list);

        if (list_size > max_list_size) {
                mlx5_en_err(ifp,
                            "ifnet vlans list size (%d) > (%d) max vport list size, some vlans will be dropped\n",
                            list_size, max_list_size);
                list_size = max_list_size;
        }

        vlans = kcalloc(list_size, sizeof(*vlans), GFP_KERNEL);
        if (!vlans)
                return -ENOMEM;

        i = 0;
        for_each_set_bit(vlan, priv->vlan.active_vlans, VLAN_N_VID) {
                if (i >= list_size)
                        break;
                vlans[i++] = vlan;
        }

        err = mlx5_modify_nic_vport_vlans(priv->mdev, vlans, list_size);
        if (err)
                mlx5_en_err(ifp, "Failed to modify vport vlans list err(%d)\n",
                           err);

        kfree(vlans);
        return err;
}

enum mlx5e_vlan_rule_type {
        MLX5E_VLAN_RULE_TYPE_UNTAGGED,
        MLX5E_VLAN_RULE_TYPE_ANY_CTAG_VID,
        MLX5E_VLAN_RULE_TYPE_ANY_STAG_VID,
        MLX5E_VLAN_RULE_TYPE_MATCH_VID,
};

static int
mlx5e_add_vlan_rule_sub(struct mlx5e_priv *priv,
    enum mlx5e_vlan_rule_type rule_type, u16 vid,
    struct mlx5_flow_spec *spec)
{
        struct mlx5_flow_table *ft = priv->fts.vlan.t;
        struct mlx5_flow_destination dest = {};
        struct mlx5_flow_handle **rule_p;
        int err = 0;
        struct mlx5_flow_act flow_act = {
                .action = MLX5_FLOW_CONTEXT_ACTION_FWD_DEST,
        };
        u8 *mv;
        u8 *mc;

        mv = (u8 *)spec->match_value;
        mc = (u8 *)spec->match_criteria;

        spec->flow_context.flow_tag = MLX5_FS_ETH_FLOW_TAG;
        spec->flow_context.flags = FLOW_CONTEXT_HAS_TAG;
        dest.type = MLX5_FLOW_DESTINATION_TYPE_FLOW_TABLE;
        dest.ft = priv->fts.vxlan.t;

        spec->match_criteria_enable = MLX5_MATCH_OUTER_HEADERS;

        switch (rule_type) {
        case MLX5E_VLAN_RULE_TYPE_UNTAGGED:
                rule_p = &priv->vlan.untagged_ft_rule;
                MLX5_SET_TO_ONES(fte_match_param, mc, outer_headers.cvlan_tag);
                break;
        case MLX5E_VLAN_RULE_TYPE_ANY_CTAG_VID:
                rule_p = &priv->vlan.any_cvlan_ft_rule;
                MLX5_SET_TO_ONES(fte_match_param, mc, outer_headers.cvlan_tag);
                MLX5_SET(fte_match_param, mv, outer_headers.cvlan_tag, 1);
                break;
        case MLX5E_VLAN_RULE_TYPE_ANY_STAG_VID:
                rule_p = &priv->vlan.any_svlan_ft_rule;
                MLX5_SET_TO_ONES(fte_match_param, mc, outer_headers.svlan_tag);
                MLX5_SET(fte_match_param, mv, outer_headers.svlan_tag, 1);
                break;
        default: /* MLX5E_VLAN_RULE_TYPE_MATCH_VID */
                rule_p = &priv->vlan.active_vlans_ft_rule[vid];
                MLX5_SET_TO_ONES(fte_match_param, mc, outer_headers.cvlan_tag);
                MLX5_SET(fte_match_param, mv, outer_headers.cvlan_tag, 1);
                MLX5_SET_TO_ONES(fte_match_param, mc, outer_headers.first_vid);
                MLX5_SET(fte_match_param, mv, outer_headers.first_vid, vid);
                mlx5e_vport_context_update_vlans(priv);
                break;
        }

        *rule_p = mlx5_add_flow_rules(ft, spec, &flow_act, &dest, 1);
        if (IS_ERR(*rule_p)) {
                err = PTR_ERR(*rule_p);
                *rule_p = NULL;
                mlx5_en_err(priv->ifp, "add rule failed\n");
        }

        return (err);
}

static int
mlx5e_add_vlan_rule(struct mlx5e_priv *priv,
    enum mlx5e_vlan_rule_type rule_type, u16 vid)
{
        struct mlx5_flow_spec *spec;
        int err = 0;

        spec = mlx5_vzalloc(sizeof(*spec));
        if (!spec) {
                mlx5_en_err(priv->ifp, "alloc failed\n");
                err = -ENOMEM;
                goto add_vlan_rule_out;
        }

        err = mlx5e_add_vlan_rule_sub(priv, rule_type, vid, spec);

add_vlan_rule_out:
        kvfree(spec);

        return (err);
}

static void
mlx5e_del_vlan_rule(struct mlx5e_priv *priv,
    enum mlx5e_vlan_rule_type rule_type, u16 vid)
{
        switch (rule_type) {
        case MLX5E_VLAN_RULE_TYPE_UNTAGGED:
                mlx5_del_flow_rules(&priv->vlan.untagged_ft_rule);
                break;
        case MLX5E_VLAN_RULE_TYPE_ANY_CTAG_VID:
                mlx5_del_flow_rules(&priv->vlan.any_cvlan_ft_rule);
                break;
        case MLX5E_VLAN_RULE_TYPE_ANY_STAG_VID:
                mlx5_del_flow_rules(&priv->vlan.any_svlan_ft_rule);
                break;
        case MLX5E_VLAN_RULE_TYPE_MATCH_VID:
                mlx5_del_flow_rules(&priv->vlan.active_vlans_ft_rule[vid]);
                mlx5e_vport_context_update_vlans(priv);
                break;
        default:
                break;
        }
}

static void
mlx5e_del_any_vid_rules(struct mlx5e_priv *priv)
{
        mlx5e_del_vlan_rule(priv, MLX5E_VLAN_RULE_TYPE_ANY_CTAG_VID, 0);
        mlx5e_del_vlan_rule(priv, MLX5E_VLAN_RULE_TYPE_ANY_STAG_VID, 0);
}

static int
mlx5e_add_any_vid_rules(struct mlx5e_priv *priv)
{
        int err;

        err = mlx5e_add_vlan_rule(priv, MLX5E_VLAN_RULE_TYPE_ANY_CTAG_VID, 0);
        if (err)
                return (err);

        err = mlx5e_add_vlan_rule(priv, MLX5E_VLAN_RULE_TYPE_ANY_STAG_VID, 0);
        if (err)
                mlx5e_del_vlan_rule(priv, MLX5E_VLAN_RULE_TYPE_ANY_CTAG_VID, 0);

        return (err);
}

void
mlx5e_enable_vlan_filter(struct mlx5e_priv *priv)
{
        if (priv->vlan.filter_disabled) {
                priv->vlan.filter_disabled = false;
                if (if_getflags(priv->ifp) & IFF_PROMISC)
                        return;
                if (test_bit(MLX5E_STATE_FLOW_RULES_READY, &priv->state))
                        mlx5e_del_any_vid_rules(priv);
        }
}

void
mlx5e_disable_vlan_filter(struct mlx5e_priv *priv)
{
        if (!priv->vlan.filter_disabled) {
                priv->vlan.filter_disabled = true;
                if (if_getflags(priv->ifp) & IFF_PROMISC)
                        return;
                if (test_bit(MLX5E_STATE_FLOW_RULES_READY, &priv->state))
                        mlx5e_add_any_vid_rules(priv);
        }
}

void
mlx5e_vlan_rx_add_vid(void *arg, if_t ifp, u16 vid)
{
        struct mlx5e_priv *priv = arg;

        if (ifp != priv->ifp)
                return;

        PRIV_LOCK(priv);
        if (!test_and_set_bit(vid, priv->vlan.active_vlans) &&
            test_bit(MLX5E_STATE_FLOW_RULES_READY, &priv->state))
                mlx5e_add_vlan_rule(priv, MLX5E_VLAN_RULE_TYPE_MATCH_VID, vid);
        PRIV_UNLOCK(priv);
}

void
mlx5e_vlan_rx_kill_vid(void *arg, if_t ifp, u16 vid)
{
        struct mlx5e_priv *priv = arg;

        if (ifp != priv->ifp)
                return;

        PRIV_LOCK(priv);
        clear_bit(vid, priv->vlan.active_vlans);
        if (test_bit(MLX5E_STATE_FLOW_RULES_READY, &priv->state))
                mlx5e_del_vlan_rule(priv, MLX5E_VLAN_RULE_TYPE_MATCH_VID, vid);
        PRIV_UNLOCK(priv);
}

static int
mlx5e_add_all_vlan_rules(struct mlx5e_priv *priv)
{
        int err;
        int i;

        set_bit(0, priv->vlan.active_vlans);
        for_each_set_bit(i, priv->vlan.active_vlans, VLAN_N_VID) {
                err = mlx5e_add_vlan_rule(priv, MLX5E_VLAN_RULE_TYPE_MATCH_VID,
                                          i);
                if (err)
                        goto error;
        }

        err = mlx5e_add_vlan_rule(priv, MLX5E_VLAN_RULE_TYPE_UNTAGGED, 0);
        if (err)
                goto error;

        if (priv->vlan.filter_disabled) {
                err = mlx5e_add_any_vid_rules(priv);
                if (err)
                        goto error;
        }
        return (0);
error:
        mlx5e_del_all_vlan_rules(priv);
        return (err);
}

static void
mlx5e_del_all_vlan_rules(struct mlx5e_priv *priv)
{
        int i;

        if (priv->vlan.filter_disabled)
                mlx5e_del_any_vid_rules(priv);

        mlx5e_del_vlan_rule(priv, MLX5E_VLAN_RULE_TYPE_UNTAGGED, 0);

        for_each_set_bit(i, priv->vlan.active_vlans, VLAN_N_VID)
                mlx5e_del_vlan_rule(priv, MLX5E_VLAN_RULE_TYPE_MATCH_VID, i);
        clear_bit(0, priv->vlan.active_vlans);
}

#define mlx5e_for_each_hash_node(hn, tmp, hash, i) \
        for (i = 0; i < MLX5E_ETH_ADDR_HASH_SIZE; i++) \
                LIST_FOREACH_SAFE(hn, &(hash)[i], hlist, tmp)

static void
mlx5e_execute_action(struct mlx5e_priv *priv,
    struct mlx5e_eth_addr_hash_node *hn)
{
        switch (hn->action) {
        case MLX5E_ACTION_ADD:
                mlx5e_add_eth_addr_rule(priv, &hn->ai, MLX5E_FULLMATCH);
                hn->action = MLX5E_ACTION_NONE;
                break;

        case MLX5E_ACTION_DEL:
                mlx5e_del_eth_addr_from_flow_table(priv, &hn->ai);
                if (hn->mpfs_index != -1U)
                        mlx5_mpfs_del_mac(priv->mdev, hn->mpfs_index);
                mlx5e_del_eth_addr_from_hash(hn);
                break;

        default:
                break;
        }
}

static struct mlx5e_eth_addr_hash_node *
mlx5e_move_hn(struct mlx5e_eth_addr_hash_head *fh, struct mlx5e_eth_addr_hash_head *uh)
{
        struct mlx5e_eth_addr_hash_node *hn;

        hn = LIST_FIRST(fh);
        if (hn != NULL) {
                LIST_REMOVE(hn, hlist);
                LIST_INSERT_HEAD(uh, hn, hlist);
        }
        return (hn);
}

static struct mlx5e_eth_addr_hash_node *
mlx5e_remove_hn(struct mlx5e_eth_addr_hash_head *fh)
{
        struct mlx5e_eth_addr_hash_node *hn;

        hn = LIST_FIRST(fh);
        if (hn != NULL)
                LIST_REMOVE(hn, hlist);
        return (hn);
}

struct mlx5e_copy_addr_ctx {
        struct mlx5e_eth_addr_hash_head *free;
        struct mlx5e_eth_addr_hash_head *fill;
        bool success;
};

static u_int
mlx5e_copy_addr(void *arg, struct sockaddr_dl *sdl, u_int cnt)
{
        struct mlx5e_copy_addr_ctx *ctx = arg;
        struct mlx5e_eth_addr_hash_node *hn;

        hn = mlx5e_move_hn(ctx->free, ctx->fill);
        if (hn == NULL) {
                ctx->success = false;
                return (0);
        }
        ether_addr_copy(hn->ai.addr, LLADDR(sdl));

        return (1);
}

static void
mlx5e_sync_ifp_addr(struct mlx5e_priv *priv)
{
        struct mlx5e_copy_addr_ctx ctx;
        struct mlx5e_eth_addr_hash_head head_free;
        struct mlx5e_eth_addr_hash_head head_uc;
        struct mlx5e_eth_addr_hash_head head_mc;
        struct mlx5e_eth_addr_hash_node *hn;
        if_t ifp = priv->ifp;
        size_t x;
        size_t num;

        PRIV_ASSERT_LOCKED(priv);

retry:
        LIST_INIT(&head_free);
        LIST_INIT(&head_uc);
        LIST_INIT(&head_mc);
        num = 1 + if_lladdr_count(ifp) + if_llmaddr_count(ifp);

        /* allocate place holders */
        for (x = 0; x != num; x++) {
                hn = malloc(sizeof(*hn), M_MLX5EN, M_WAITOK | M_ZERO);
                hn->action = MLX5E_ACTION_ADD;
                hn->mpfs_index = -1U;
                LIST_INSERT_HEAD(&head_free, hn, hlist);
        }

        hn = mlx5e_move_hn(&head_free, &head_uc);
        MPASS(hn != NULL);

        ether_addr_copy(hn->ai.addr, if_getlladdr(ifp));

        ctx.free = &head_free;
        ctx.fill = &head_uc;
        ctx.success = true;
        if_foreach_lladdr(ifp, mlx5e_copy_addr, &ctx);
        if (ctx.success == false)
                goto cleanup;

        ctx.fill = &head_mc;
        if_foreach_llmaddr(ifp, mlx5e_copy_addr, &ctx);
        if (ctx.success == false)
                goto cleanup;

        /* insert L2 unicast addresses into hash list */

        while ((hn = mlx5e_remove_hn(&head_uc)) != NULL) {
                if (mlx5e_add_eth_addr_to_hash(priv->eth_addr.if_uc, hn) == 0)
                        continue;
                if (hn->mpfs_index == -1U)
                        mlx5_mpfs_add_mac(priv->mdev, &hn->mpfs_index,
                            hn->ai.addr, 0, 0);
        }

        /* insert L2 multicast addresses into hash list */

        while ((hn = mlx5e_remove_hn(&head_mc)) != NULL) {
                if (mlx5e_add_eth_addr_to_hash(priv->eth_addr.if_mc, hn) == 0)
                        continue;
        }

cleanup:
        while ((hn = mlx5e_remove_hn(&head_uc)) != NULL)
                free(hn, M_MLX5EN);
        while ((hn = mlx5e_remove_hn(&head_mc)) != NULL)
                free(hn, M_MLX5EN);
        while ((hn = mlx5e_remove_hn(&head_free)) != NULL)
                free(hn, M_MLX5EN);

        if (ctx.success == false)
                goto retry;
}

static void mlx5e_fill_addr_array(struct mlx5e_priv *priv, int list_type,
                                  u8 addr_array[][ETH_ALEN], int size)
{
        bool is_uc = (list_type == MLX5_NIC_VPORT_LIST_TYPE_UC);
        if_t ifp = priv->ifp;
        struct mlx5e_eth_addr_hash_node *hn;
        struct mlx5e_eth_addr_hash_head *addr_list;
        struct mlx5e_eth_addr_hash_node *tmp;
        int i = 0;
        int hi;

        addr_list = is_uc ? priv->eth_addr.if_uc : priv->eth_addr.if_mc;

        if (is_uc) /* Make sure our own address is pushed first */
                ether_addr_copy(addr_array[i++], if_getlladdr(ifp));
        else if (priv->eth_addr.broadcast_enabled)
                ether_addr_copy(addr_array[i++], if_getbroadcastaddr(ifp));

        mlx5e_for_each_hash_node(hn, tmp, addr_list, hi) {
                if (ether_addr_equal(if_getlladdr(ifp), hn->ai.addr))
                        continue;
                if (i >= size)
                        break;
                ether_addr_copy(addr_array[i++], hn->ai.addr);
        }
}

static void mlx5e_vport_context_update_addr_list(struct mlx5e_priv *priv,
                                                 int list_type)
{
        bool is_uc = (list_type == MLX5_NIC_VPORT_LIST_TYPE_UC);
        struct mlx5e_eth_addr_hash_node *hn;
        u8 (*addr_array)[ETH_ALEN] = NULL;
        struct mlx5e_eth_addr_hash_head *addr_list;
        struct mlx5e_eth_addr_hash_node *tmp;
        int max_size;
        int size;
        int err;
        int hi;

        size = is_uc ? 0 : (priv->eth_addr.broadcast_enabled ? 1 : 0);
        max_size = is_uc ?
                1 << MLX5_CAP_GEN(priv->mdev, log_max_current_uc_list) :
                1 << MLX5_CAP_GEN(priv->mdev, log_max_current_mc_list);

        addr_list = is_uc ? priv->eth_addr.if_uc : priv->eth_addr.if_mc;
        mlx5e_for_each_hash_node(hn, tmp, addr_list, hi)
                size++;

        if (size > max_size) {
                mlx5_en_err(priv->ifp,
                            "ifp %s list size (%d) > (%d) max vport list size, some addresses will be dropped\n",
                            is_uc ? "UC" : "MC", size, max_size);
                size = max_size;
        }

        if (size) {
                addr_array = kcalloc(size, ETH_ALEN, GFP_KERNEL);
                if (!addr_array) {
                        err = -ENOMEM;
                        goto out;
                }
                mlx5e_fill_addr_array(priv, list_type, addr_array, size);
        }

        err = mlx5_modify_nic_vport_mac_list(priv->mdev, list_type, addr_array, size);
out:
        if (err)
                mlx5_en_err(priv->ifp,
                           "Failed to modify vport %s list err(%d)\n",
                           is_uc ? "UC" : "MC", err);
        kfree(addr_array);
}

static void mlx5e_vport_context_update(struct mlx5e_priv *priv)
{
        struct mlx5e_eth_addr_db *ea = &priv->eth_addr;

        mlx5e_vport_context_update_addr_list(priv, MLX5_NIC_VPORT_LIST_TYPE_UC);
        mlx5e_vport_context_update_addr_list(priv, MLX5_NIC_VPORT_LIST_TYPE_MC);
        mlx5_modify_nic_vport_promisc(priv->mdev, 0,
                                      ea->allmulti_enabled,
                                      ea->promisc_enabled);
}

static void
mlx5e_apply_ifp_addr(struct mlx5e_priv *priv)
{
        struct mlx5e_eth_addr_hash_node *hn;
        struct mlx5e_eth_addr_hash_node *tmp;
        int i;

        mlx5e_for_each_hash_node(hn, tmp, priv->eth_addr.if_uc, i)
            mlx5e_execute_action(priv, hn);

        mlx5e_for_each_hash_node(hn, tmp, priv->eth_addr.if_mc, i)
            mlx5e_execute_action(priv, hn);
}

static void
mlx5e_handle_ifp_addr(struct mlx5e_priv *priv, bool rx_mode_enable)
{
        struct mlx5e_eth_addr_hash_node *hn;
        struct mlx5e_eth_addr_hash_node *tmp;
        int i;

        mlx5e_for_each_hash_node(hn, tmp, priv->eth_addr.if_uc, i)
            hn->action = MLX5E_ACTION_DEL;
        mlx5e_for_each_hash_node(hn, tmp, priv->eth_addr.if_mc, i)
            hn->action = MLX5E_ACTION_DEL;

        if (rx_mode_enable)
                mlx5e_sync_ifp_addr(priv);

        mlx5e_apply_ifp_addr(priv);
}

static void
mlx5e_set_rx_mode_core(struct mlx5e_priv *priv, bool rx_mode_enable)
{
        struct mlx5e_eth_addr_db *ea = &priv->eth_addr;
        if_t ndev = priv->ifp;
        int ndev_flags = if_getflags(ndev);

        bool promisc_enabled = rx_mode_enable && (ndev_flags & IFF_PROMISC);
        bool allmulti_enabled = rx_mode_enable && (ndev_flags & IFF_ALLMULTI);
        bool broadcast_enabled = rx_mode_enable;

        bool enable_promisc = !ea->promisc_enabled && promisc_enabled;
        bool disable_promisc = ea->promisc_enabled && !promisc_enabled;
        bool enable_allmulti = !ea->allmulti_enabled && allmulti_enabled;
        bool disable_allmulti = ea->allmulti_enabled && !allmulti_enabled;
        bool enable_broadcast = !ea->broadcast_enabled && broadcast_enabled;
        bool disable_broadcast = ea->broadcast_enabled && !broadcast_enabled;

        /* update broadcast address */
        ether_addr_copy(priv->eth_addr.broadcast.addr,
            if_getbroadcastaddr(priv->ifp));

        if (enable_promisc) {
                mlx5e_add_eth_addr_rule(priv, &ea->promisc, MLX5E_PROMISC);
                if (!priv->vlan.filter_disabled)
                        mlx5e_add_any_vid_rules(priv);
        }
        if (enable_allmulti)
                mlx5e_add_eth_addr_rule(priv, &ea->allmulti, MLX5E_ALLMULTI);
        if (enable_broadcast)
                mlx5e_add_eth_addr_rule(priv, &ea->broadcast, MLX5E_FULLMATCH);

        mlx5e_handle_ifp_addr(priv, rx_mode_enable);

        if (disable_broadcast)
                mlx5e_del_eth_addr_from_flow_table(priv, &ea->broadcast);
        if (disable_allmulti)
                mlx5e_del_eth_addr_from_flow_table(priv, &ea->allmulti);
        if (disable_promisc) {
                if (!priv->vlan.filter_disabled)
                        mlx5e_del_any_vid_rules(priv);
                mlx5e_del_eth_addr_from_flow_table(priv, &ea->promisc);
        }

        ea->promisc_enabled = promisc_enabled;
        ea->allmulti_enabled = allmulti_enabled;
        ea->broadcast_enabled = broadcast_enabled;

        mlx5e_vport_context_update(priv);
}

void
mlx5e_set_rx_mode_work(struct work_struct *work)
{
        struct mlx5e_priv *priv =
            container_of(work, struct mlx5e_priv, set_rx_mode_work);

        PRIV_LOCK(priv);
        if (test_bit(MLX5E_STATE_FLOW_RULES_READY, &priv->state))
                mlx5e_set_rx_mode_core(priv, true);
        PRIV_UNLOCK(priv);
}

static void
mlx5e_destroy_groups(struct mlx5e_flow_table *ft)
{
        int i;

        for (i = ft->num_groups - 1; i >= 0; i--) {
                if (!IS_ERR_OR_NULL(ft->g[i]))
                        mlx5_destroy_flow_group(ft->g[i]);
                ft->g[i] = NULL;
        }
        ft->num_groups = 0;
}

static void
mlx5e_destroy_flow_table(struct mlx5e_flow_table *ft)
{
        mlx5e_destroy_groups(ft);
        kfree(ft->g);
        mlx5_destroy_flow_table(ft->t);
        ft->t = NULL;
}

#define MLX5E_NUM_MAIN_GROUPS   10
#define MLX5E_MAIN_GROUP0_SIZE  BIT(4)
#define MLX5E_MAIN_GROUP1_SIZE  BIT(3)
#define MLX5E_MAIN_GROUP2_SIZE  BIT(1)
#define MLX5E_MAIN_GROUP3_SIZE  BIT(0)
#define MLX5E_MAIN_GROUP4_SIZE  BIT(14)
#define MLX5E_MAIN_GROUP5_SIZE  BIT(13)
#define MLX5E_MAIN_GROUP6_SIZE  BIT(11)
#define MLX5E_MAIN_GROUP7_SIZE  BIT(2)
#define MLX5E_MAIN_GROUP8_SIZE  BIT(1)
#define MLX5E_MAIN_GROUP9_SIZE  BIT(0)
#define MLX5E_MAIN_TABLE_SIZE   (MLX5E_MAIN_GROUP0_SIZE +\
                                 MLX5E_MAIN_GROUP1_SIZE +\
                                 MLX5E_MAIN_GROUP2_SIZE +\
                                 MLX5E_MAIN_GROUP3_SIZE +\
                                 MLX5E_MAIN_GROUP4_SIZE +\
                                 MLX5E_MAIN_GROUP5_SIZE +\
                                 MLX5E_MAIN_GROUP6_SIZE +\
                                 MLX5E_MAIN_GROUP7_SIZE +\
                                 MLX5E_MAIN_GROUP8_SIZE +\
                                 MLX5E_MAIN_GROUP9_SIZE +\
                                 0)

static int
mlx5e_create_main_groups_sub(struct mlx5e_flow_table *ft, u32 *in,
                                      int inlen)
{
        u8 *mc = MLX5_ADDR_OF(create_flow_group_in, in, match_criteria);
        u8 *dmac = MLX5_ADDR_OF(create_flow_group_in, in,
                                match_criteria.outer_headers.dmac_47_16);
        int err;
        int ix = 0;

        /* Tunnel rules need to be first in this list of groups */

        /* Start tunnel rules */
        memset(in, 0, inlen);
        MLX5_SET_CFG(in, match_criteria_enable, MLX5_MATCH_OUTER_HEADERS);
        MLX5_SET_TO_ONES(fte_match_param, mc, outer_headers.ethertype);
        MLX5_SET_TO_ONES(fte_match_param, mc, outer_headers.ip_protocol);
        MLX5_SET_TO_ONES(fte_match_param, mc, outer_headers.udp_dport);
        MLX5_SET_CFG(in, start_flow_index, ix);
        ix += MLX5E_MAIN_GROUP0_SIZE;
        MLX5_SET_CFG(in, end_flow_index, ix - 1);
        ft->g[ft->num_groups] = mlx5_create_flow_group(ft->t, in);
        if (IS_ERR(ft->g[ft->num_groups]))
                goto err_destory_groups;
        ft->num_groups++;
        /* End Tunnel Rules */

        memset(in, 0, inlen);
        MLX5_SET_CFG(in, match_criteria_enable, MLX5_MATCH_OUTER_HEADERS);
        MLX5_SET_TO_ONES(fte_match_param, mc, outer_headers.ethertype);
        MLX5_SET_TO_ONES(fte_match_param, mc, outer_headers.ip_protocol);
        MLX5_SET_CFG(in, start_flow_index, ix);
        ix += MLX5E_MAIN_GROUP1_SIZE;
        MLX5_SET_CFG(in, end_flow_index, ix - 1);
        ft->g[ft->num_groups] = mlx5_create_flow_group(ft->t, in);
        if (IS_ERR(ft->g[ft->num_groups]))
                goto err_destory_groups;
        ft->num_groups++;

        memset(in, 0, inlen);
        MLX5_SET_CFG(in, match_criteria_enable, MLX5_MATCH_OUTER_HEADERS);
        MLX5_SET_TO_ONES(fte_match_param, mc, outer_headers.ethertype);
        MLX5_SET_CFG(in, start_flow_index, ix);
        ix += MLX5E_MAIN_GROUP2_SIZE;
        MLX5_SET_CFG(in, end_flow_index, ix - 1);
        ft->g[ft->num_groups] = mlx5_create_flow_group(ft->t, in);
        if (IS_ERR(ft->g[ft->num_groups]))
                goto err_destory_groups;
        ft->num_groups++;

        memset(in, 0, inlen);
        MLX5_SET_CFG(in, start_flow_index, ix);
        ix += MLX5E_MAIN_GROUP3_SIZE;
        MLX5_SET_CFG(in, end_flow_index, ix - 1);
        ft->g[ft->num_groups] = mlx5_create_flow_group(ft->t, in);
        if (IS_ERR(ft->g[ft->num_groups]))
                goto err_destory_groups;
        ft->num_groups++;

        memset(in, 0, inlen);
        MLX5_SET_CFG(in, match_criteria_enable, MLX5_MATCH_OUTER_HEADERS);
        MLX5_SET_TO_ONES(fte_match_param, mc, outer_headers.ethertype);
        MLX5_SET_TO_ONES(fte_match_param, mc, outer_headers.ip_protocol);
        memset(dmac, 0xff, ETH_ALEN);
        MLX5_SET_CFG(in, start_flow_index, ix);
        ix += MLX5E_MAIN_GROUP4_SIZE;
        MLX5_SET_CFG(in, end_flow_index, ix - 1);
        ft->g[ft->num_groups] = mlx5_create_flow_group(ft->t, in);
        if (IS_ERR(ft->g[ft->num_groups]))
                goto err_destory_groups;
        ft->num_groups++;

        memset(in, 0, inlen);
        MLX5_SET_CFG(in, match_criteria_enable, MLX5_MATCH_OUTER_HEADERS);
        MLX5_SET_TO_ONES(fte_match_param, mc, outer_headers.ethertype);
        memset(dmac, 0xff, ETH_ALEN);
        MLX5_SET_CFG(in, start_flow_index, ix);
        ix += MLX5E_MAIN_GROUP5_SIZE;
        MLX5_SET_CFG(in, end_flow_index, ix - 1);
        ft->g[ft->num_groups] = mlx5_create_flow_group(ft->t, in);
        if (IS_ERR(ft->g[ft->num_groups]))
                goto err_destory_groups;
        ft->num_groups++;

        memset(in, 0, inlen);
        MLX5_SET_CFG(in, match_criteria_enable, MLX5_MATCH_OUTER_HEADERS);
        memset(dmac, 0xff, ETH_ALEN);
        MLX5_SET_CFG(in, start_flow_index, ix);
        ix += MLX5E_MAIN_GROUP6_SIZE;
        MLX5_SET_CFG(in, end_flow_index, ix - 1);
        ft->g[ft->num_groups] = mlx5_create_flow_group(ft->t, in);
        if (IS_ERR(ft->g[ft->num_groups]))
                goto err_destory_groups;
        ft->num_groups++;

        memset(in, 0, inlen);
        MLX5_SET_CFG(in, match_criteria_enable, MLX5_MATCH_OUTER_HEADERS);
        MLX5_SET_TO_ONES(fte_match_param, mc, outer_headers.ethertype);
        MLX5_SET_TO_ONES(fte_match_param, mc, outer_headers.ip_protocol);
        dmac[0] = 0x01;
        MLX5_SET_CFG(in, start_flow_index, ix);
        ix += MLX5E_MAIN_GROUP7_SIZE;
        MLX5_SET_CFG(in, end_flow_index, ix - 1);
        ft->g[ft->num_groups] = mlx5_create_flow_group(ft->t, in);
        if (IS_ERR(ft->g[ft->num_groups]))
                goto err_destory_groups;
        ft->num_groups++;

        memset(in, 0, inlen);
        MLX5_SET_CFG(in, match_criteria_enable, MLX5_MATCH_OUTER_HEADERS);
        MLX5_SET_TO_ONES(fte_match_param, mc, outer_headers.ethertype);
        dmac[0] = 0x01;
        MLX5_SET_CFG(in, start_flow_index, ix);
        ix += MLX5E_MAIN_GROUP8_SIZE;
        MLX5_SET_CFG(in, end_flow_index, ix - 1);
        ft->g[ft->num_groups] = mlx5_create_flow_group(ft->t, in);
        if (IS_ERR(ft->g[ft->num_groups]))
                goto err_destory_groups;
        ft->num_groups++;

        memset(in, 0, inlen);
        MLX5_SET_CFG(in, match_criteria_enable, MLX5_MATCH_OUTER_HEADERS);
        dmac[0] = 0x01;
        MLX5_SET_CFG(in, start_flow_index, ix);
        ix += MLX5E_MAIN_GROUP9_SIZE;
        MLX5_SET_CFG(in, end_flow_index, ix - 1);
        ft->g[ft->num_groups] = mlx5_create_flow_group(ft->t, in);
        if (IS_ERR(ft->g[ft->num_groups]))
                goto err_destory_groups;
        ft->num_groups++;

        return (0);

err_destory_groups:
        err = PTR_ERR(ft->g[ft->num_groups]);
        ft->g[ft->num_groups] = NULL;
        mlx5e_destroy_groups(ft);

        return (err);
}

static int
mlx5e_create_main_groups(struct mlx5e_flow_table *ft)
{
        u32 *in;
        int inlen = MLX5_ST_SZ_BYTES(create_flow_group_in);
        int err;

        in = mlx5_vzalloc(inlen);
        if (!in)
                return (-ENOMEM);

        err = mlx5e_create_main_groups_sub(ft, in, inlen);

        kvfree(in);
        return (err);
}

#define MLX5E_MAIN_VXLAN_GROUP0_SIZE    BIT(3)
#define MLX5E_MAIN_VXLAN_GROUP1_SIZE    BIT(3)
#define MLX5E_MAIN_VXLAN_GROUP2_SIZE    BIT(0)
static int
mlx5e_create_main_vxlan_groups_sub(struct mlx5e_flow_table *ft, u32 *in,
    int inlen)
{
        u8 *mc = MLX5_ADDR_OF(create_flow_group_in, in, match_criteria);
        int err;
        int ix = 0;

        memset(in, 0, inlen);
        MLX5_SET_CFG(in, match_criteria_enable, MLX5_MATCH_INNER_HEADERS);
        MLX5_SET_TO_ONES(fte_match_param, mc, inner_headers.ethertype);
        MLX5_SET_TO_ONES(fte_match_param, mc, inner_headers.ip_protocol);
        MLX5_SET_CFG(in, start_flow_index, ix);
        ix += MLX5E_MAIN_VXLAN_GROUP0_SIZE;
        MLX5_SET_CFG(in, end_flow_index, ix - 1);
        ft->g[ft->num_groups] = mlx5_create_flow_group(ft->t, in);
        if (IS_ERR(ft->g[ft->num_groups]))
                goto err_destory_groups;
        ft->num_groups++;

        memset(in, 0, inlen);
        MLX5_SET_CFG(in, match_criteria_enable, MLX5_MATCH_INNER_HEADERS);
        MLX5_SET_TO_ONES(fte_match_param, mc, inner_headers.ethertype);
        MLX5_SET_CFG(in, start_flow_index, ix);
        ix += MLX5E_MAIN_VXLAN_GROUP1_SIZE;
        MLX5_SET_CFG(in, end_flow_index, ix - 1);
        ft->g[ft->num_groups] = mlx5_create_flow_group(ft->t, in);
        if (IS_ERR(ft->g[ft->num_groups]))
                goto err_destory_groups;
        ft->num_groups++;

        memset(in, 0, inlen);
        MLX5_SET_CFG(in, start_flow_index, ix);
        ix += MLX5E_MAIN_VXLAN_GROUP2_SIZE;
        MLX5_SET_CFG(in, end_flow_index, ix - 1);
        ft->g[ft->num_groups] = mlx5_create_flow_group(ft->t, in);
        if (IS_ERR(ft->g[ft->num_groups]))
                goto err_destory_groups;
        ft->num_groups++;

        return (0);

err_destory_groups:
        err = PTR_ERR(ft->g[ft->num_groups]);
        ft->g[ft->num_groups] = NULL;
        mlx5e_destroy_groups(ft);

        return (err);
}

static int
mlx5e_create_main_vxlan_groups(struct mlx5e_flow_table *ft)
{
        u32 *in;
        int inlen = MLX5_ST_SZ_BYTES(create_flow_group_in);
        int err;

        in = mlx5_vzalloc(inlen);
        if (!in)
                return (-ENOMEM);

        err = mlx5e_create_main_vxlan_groups_sub(ft, in, inlen);

        kvfree(in);
        return (err);
}


static int
mlx5e_create_main_flow_table(struct mlx5e_priv *priv, bool inner_vxlan)
{
        struct mlx5e_flow_table *ft = inner_vxlan ? &priv->fts.main_vxlan :
            &priv->fts.main;
        struct mlx5_flow_table_attr ft_attr = {};
        int err;

        ft->num_groups = 0;
        ft_attr.max_fte = MLX5E_MAIN_TABLE_SIZE;
        if (priv->ipsec)
                ft_attr.level = inner_vxlan ? 10 : 12;
        else
                ft_attr.level = inner_vxlan ? 2 : 4;
        ft->t = mlx5_create_flow_table(priv->fts.ns, &ft_attr);

        if (IS_ERR(ft->t)) {
                err = PTR_ERR(ft->t);
                ft->t = NULL;
                return (err);
        }
        ft->g = kcalloc(MLX5E_NUM_MAIN_GROUPS, sizeof(*ft->g), GFP_KERNEL);
        if (!ft->g) {
                err = -ENOMEM;
                goto err_destroy_main_flow_table;
        }

        err = inner_vxlan ? mlx5e_create_main_vxlan_groups(ft) :
            mlx5e_create_main_groups(ft);
        if (err)
                goto err_free_g;
        return (0);

err_free_g:
        kfree(ft->g);

err_destroy_main_flow_table:
        mlx5_destroy_flow_table(ft->t);
        ft->t = NULL;

        return (err);
}

static void mlx5e_destroy_main_flow_table(struct mlx5e_priv *priv)
{
        mlx5e_destroy_flow_table(&priv->fts.main);
}

static void mlx5e_destroy_main_vxlan_flow_table(struct mlx5e_priv *priv)
{
        mlx5e_destroy_flow_table(&priv->fts.main_vxlan);
}

#define MLX5E_NUM_VLAN_GROUPS   3
#define MLX5E_VLAN_GROUP0_SIZE  BIT(12)
#define MLX5E_VLAN_GROUP1_SIZE  BIT(1)
#define MLX5E_VLAN_GROUP2_SIZE  BIT(0)
#define MLX5E_VLAN_TABLE_SIZE   (MLX5E_VLAN_GROUP0_SIZE +\
                                 MLX5E_VLAN_GROUP1_SIZE +\
                                 MLX5E_VLAN_GROUP2_SIZE +\
                                 0)

static int
mlx5e_create_vlan_groups_sub(struct mlx5e_flow_table *ft, u32 *in,
                                      int inlen)
{
        int err;
        int ix = 0;
        u8 *mc = MLX5_ADDR_OF(create_flow_group_in, in, match_criteria);

        memset(in, 0, inlen);
        MLX5_SET_CFG(in, match_criteria_enable, MLX5_MATCH_OUTER_HEADERS);
        MLX5_SET_TO_ONES(fte_match_param, mc, outer_headers.cvlan_tag);
        MLX5_SET_TO_ONES(fte_match_param, mc, outer_headers.first_vid);
        MLX5_SET_CFG(in, start_flow_index, ix);
        ix += MLX5E_VLAN_GROUP0_SIZE;
        MLX5_SET_CFG(in, end_flow_index, ix - 1);
        ft->g[ft->num_groups] = mlx5_create_flow_group(ft->t, in);
        if (IS_ERR(ft->g[ft->num_groups]))
                goto err_destory_groups;
        ft->num_groups++;

        memset(in, 0, inlen);
        MLX5_SET_CFG(in, match_criteria_enable, MLX5_MATCH_OUTER_HEADERS);
        MLX5_SET_TO_ONES(fte_match_param, mc, outer_headers.cvlan_tag);
        MLX5_SET_CFG(in, start_flow_index, ix);
        ix += MLX5E_VLAN_GROUP1_SIZE;
        MLX5_SET_CFG(in, end_flow_index, ix - 1);
        ft->g[ft->num_groups] = mlx5_create_flow_group(ft->t, in);
        if (IS_ERR(ft->g[ft->num_groups]))
                goto err_destory_groups;
        ft->num_groups++;

        memset(in, 0, inlen);
        MLX5_SET_CFG(in, match_criteria_enable, MLX5_MATCH_OUTER_HEADERS);
        MLX5_SET_TO_ONES(fte_match_param, mc, outer_headers.svlan_tag);
        MLX5_SET_CFG(in, start_flow_index, ix);
        ix += MLX5E_VLAN_GROUP2_SIZE;
        MLX5_SET_CFG(in, end_flow_index, ix - 1);
        ft->g[ft->num_groups] = mlx5_create_flow_group(ft->t, in);
        if (IS_ERR(ft->g[ft->num_groups]))
                goto err_destory_groups;
        ft->num_groups++;

        return (0);

err_destory_groups:
        err = PTR_ERR(ft->g[ft->num_groups]);
        ft->g[ft->num_groups] = NULL;
        mlx5e_destroy_groups(ft);

        return (err);
}

static int
mlx5e_create_vlan_groups(struct mlx5e_flow_table *ft)
{
        u32 *in;
        int inlen = MLX5_ST_SZ_BYTES(create_flow_group_in);
        int err;

        in = mlx5_vzalloc(inlen);
        if (!in)
                return (-ENOMEM);

        err = mlx5e_create_vlan_groups_sub(ft, in, inlen);

        kvfree(in);
        return (err);
}

static int
mlx5e_create_vlan_flow_table(struct mlx5e_priv *priv)
{
        struct mlx5e_flow_table *ft = &priv->fts.vlan;
        struct mlx5_flow_table_attr ft_attr = {};
        int err;

        ft->num_groups = 0;
        ft_attr.max_fte = MLX5E_VLAN_TABLE_SIZE;
        ft_attr.level = (priv->ipsec) ? 9 : 0;
        ft->t = mlx5_create_flow_table(priv->fts.ns, &ft_attr);

        if (IS_ERR(ft->t)) {
                err = PTR_ERR(ft->t);
                ft->t = NULL;
                return (err);
        }
        ft->g = kcalloc(MLX5E_NUM_VLAN_GROUPS, sizeof(*ft->g), GFP_KERNEL);
        if (!ft->g) {
                err = -ENOMEM;
                goto err_destroy_vlan_flow_table;
        }

        err = mlx5e_create_vlan_groups(ft);
        if (err)
                goto err_free_g;

        return (0);

err_free_g:
        kfree(ft->g);

err_destroy_vlan_flow_table:
        mlx5_destroy_flow_table(ft->t);
        ft->t = NULL;

        return (err);
}

static void
mlx5e_destroy_vlan_flow_table(struct mlx5e_priv *priv)
{
        mlx5e_destroy_flow_table(&priv->fts.vlan);
}

static int
mlx5e_add_vxlan_rule_sub(struct mlx5e_priv *priv, struct mlx5_flow_spec *spec,
    struct mlx5e_vxlan_db_el *el)
{
        struct mlx5_flow_table *ft = priv->fts.vxlan.t;
        struct mlx5_flow_destination dest = {};
        struct mlx5_flow_handle **rule_p;
        int err = 0;
        struct mlx5_flow_act flow_act = {
                .action = MLX5_FLOW_CONTEXT_ACTION_FWD_DEST,
        };
        u8 *mc;
        u8 *mv;

        mv = (u8 *)spec->match_value;
        mc = (u8 *)spec->match_criteria;

        spec->flow_context.flow_tag = MLX5_FS_ETH_FLOW_TAG;
        spec->flow_context.flags = FLOW_CONTEXT_HAS_TAG;

        dest.type = MLX5_FLOW_DESTINATION_TYPE_FLOW_TABLE;
        dest.ft = priv->fts.main_vxlan.t;

        spec->match_criteria_enable = MLX5_MATCH_OUTER_HEADERS;
        rule_p = &el->vxlan_ft_rule;
        MLX5_SET_TO_ONES(fte_match_param, mc, outer_headers.ethertype);
        MLX5_SET(fte_match_param, mv, outer_headers.ethertype, el->proto);
        MLX5_SET_TO_ONES(fte_match_param, mc, outer_headers.ip_protocol);
        MLX5_SET(fte_match_param, mv, outer_headers.ip_protocol, IPPROTO_UDP);
        MLX5_SET_TO_ONES(fte_match_param, mc, outer_headers.udp_dport);
        MLX5_SET(fte_match_param, mv, outer_headers.udp_dport, el->port);

        *rule_p = mlx5_add_flow_rules(ft, spec, &flow_act, &dest, 1);

        if (IS_ERR(*rule_p)) {
                err = PTR_ERR(*rule_p);
                *rule_p = NULL;
                mlx5_en_err(priv->ifp, "add rule failed\n");
        }

        return (err);
}

static struct mlx5e_vxlan_db_el *
mlx5e_vxlan_find_db_el(struct mlx5e_priv *priv, u_int proto, u_int port)
{
        struct mlx5e_vxlan_db_el *el;

        TAILQ_FOREACH(el, &priv->vxlan.head, link) {
                if (el->proto == proto && el->port == port)
                        return (el);
        }
        return (NULL);
}

static struct mlx5e_vxlan_db_el *
mlx5e_vxlan_alloc_db_el(struct mlx5e_priv *priv, u_int proto, u_int port)
{
        struct mlx5e_vxlan_db_el *el;

        el = mlx5_vzalloc(sizeof(*el));
        el->refcount = 1;
        el->proto = proto;
        el->port = port;
        el->vxlan_ft_rule = NULL;
        return (el);
}

static int
mlx5e_vxlan_family_to_proto(sa_family_t family, u_int *proto)
{
        switch (family) {
        case AF_INET:
                *proto = ETHERTYPE_IP;
                return (0);
        case AF_INET6:
                *proto = ETHERTYPE_IPV6;
                return (0);
        default:
                return (-EINVAL);
        }
}

static int
mlx5e_add_vxlan_rule_from_db(struct mlx5e_priv *priv,
    struct mlx5e_vxlan_db_el *el)
{
        struct mlx5_flow_spec *spec;
        int err;

        spec = mlx5_vzalloc(sizeof(*spec));
        if (!spec) {
                mlx5_en_err(priv->ifp, "alloc failed\n");
                err = -ENOMEM;
                goto add_vxlan_rule_out;
        }

        err = mlx5e_add_vxlan_rule_sub(priv, spec, el);

add_vxlan_rule_out:
        kvfree(spec);

        return (err);
}

static int
mlx5e_add_vxlan_rule(struct mlx5e_priv *priv, sa_family_t family, u_int port)
{
        struct mlx5e_vxlan_db_el *el;
        u_int proto;
        int err;

        err = mlx5e_vxlan_family_to_proto(family, &proto);
        if (err != 0)
                return (err);

        el = mlx5e_vxlan_find_db_el(priv, proto, port);
        if (el != NULL) {
                el->refcount++;
                if (el->installed)
                        return (0);
        } else
                el = mlx5e_vxlan_alloc_db_el(priv, proto, port);

        if ((if_getcapenable(priv->ifp) & IFCAP_VXLAN_HWCSUM) != 0) {
                err = mlx5e_add_vxlan_rule_from_db(priv, el);
                if (err == 0)
                        el->installed = true;
        }
        if (err == 0)
                TAILQ_INSERT_TAIL(&priv->vxlan.head, el, link);
        else
                kvfree(el);

        return (err);
}

static int
mlx5e_add_vxlan_catchall_rule_sub(struct mlx5e_priv *priv,
                                  struct mlx5_flow_spec *spec)
{
        struct mlx5_flow_table *ft = priv->fts.vxlan.t;
        struct mlx5_flow_destination dest = {};
        struct mlx5_flow_handle **rule_p;
        int err = 0;
        struct mlx5_flow_act flow_act = {
                .action = MLX5_FLOW_CONTEXT_ACTION_FWD_DEST,
        };

        spec->flow_context.flow_tag = MLX5_FS_ETH_FLOW_TAG;
        spec->flow_context.flags = FLOW_CONTEXT_HAS_TAG;

        dest.type = MLX5_FLOW_DESTINATION_TYPE_FLOW_TABLE;
        dest.ft = priv->fts.main.t;

        rule_p = &priv->fts.vxlan_catchall_ft_rule;
        *rule_p = mlx5_add_flow_rules(ft, spec, &flow_act, &dest, 1);

        if (IS_ERR(*rule_p)) {
                err = PTR_ERR(*rule_p);
                *rule_p = NULL;
                mlx5_en_err(priv->ifp, "add rule failed\n");
        }

        return (err);
}


static int
mlx5e_add_vxlan_catchall_rule(struct mlx5e_priv *priv)
{
        struct mlx5_flow_spec *spec;
        int err;

        spec = mlx5_vzalloc(sizeof(*spec));
        if (!spec) {
                mlx5_en_err(priv->ifp, "alloc failed\n");
                err = -ENOMEM;
                goto add_vxlan_rule_out;
        }

        err = mlx5e_add_vxlan_catchall_rule_sub(priv, spec);

add_vxlan_rule_out:
        kvfree(spec);

        return (err);
}

int
mlx5e_add_all_vxlan_rules(struct mlx5e_priv *priv)
{
        struct mlx5e_vxlan_db_el *el;
        int err;

        err = 0;
        TAILQ_FOREACH(el, &priv->vxlan.head, link) {
                if (el->installed)
                        continue;
                err = mlx5e_add_vxlan_rule_from_db(priv, el);
                if (err != 0)
                        break;
                el->installed = true;
        }

        return (err);
}

static int
mlx5e_del_vxlan_rule(struct mlx5e_priv *priv, sa_family_t family, u_int port)
{
        struct mlx5e_vxlan_db_el *el;
        u_int proto;
        int err;

        err = mlx5e_vxlan_family_to_proto(family, &proto);
        if (err != 0)
                return (err);

        el = mlx5e_vxlan_find_db_el(priv, proto, port);
        if (el == NULL)
                return (0);
        if (el->refcount > 1) {
                el->refcount--;
                return (0);
        }

        if (el->installed)
                mlx5_del_flow_rules(&el->vxlan_ft_rule);
        TAILQ_REMOVE(&priv->vxlan.head, el, link);
        kvfree(el);
        return (0);
}

void
mlx5e_del_all_vxlan_rules(struct mlx5e_priv *priv)
{
        struct mlx5e_vxlan_db_el *el;

        TAILQ_FOREACH(el, &priv->vxlan.head, link) {
                if (!el->installed)
                        continue;
                mlx5_del_flow_rules(&el->vxlan_ft_rule);
                el->installed = false;
        }
}

static void
mlx5e_del_vxlan_catchall_rule(struct mlx5e_priv *priv)
{
        mlx5_del_flow_rules(&priv->fts.vxlan_catchall_ft_rule);
}

void
mlx5e_vxlan_start(void *arg, if_t ifp __unused, sa_family_t family,
    u_int port)
{
        struct mlx5e_priv *priv = arg;
        int err;

        PRIV_LOCK(priv);
        err = mlx5_vxlan_udp_port_add(priv->mdev, port);
        if (err == 0 && test_bit(MLX5E_STATE_FLOW_RULES_READY, &priv->state))
                mlx5e_add_vxlan_rule(priv, family, port);
        PRIV_UNLOCK(priv);
}

void
mlx5e_vxlan_stop(void *arg, if_t ifp __unused, sa_family_t family,
    u_int port)
{
        struct mlx5e_priv *priv = arg;

        PRIV_LOCK(priv);
        if (test_bit(MLX5E_STATE_FLOW_RULES_READY, &priv->state))
                mlx5e_del_vxlan_rule(priv, family, port);
        (void)mlx5_vxlan_udp_port_delete(priv->mdev, port);
        PRIV_UNLOCK(priv);
}

#define MLX5E_VXLAN_GROUP0_SIZE BIT(3)  /* XXXKIB */
#define MLX5E_VXLAN_GROUP1_SIZE BIT(0)
#define MLX5E_NUM_VXLAN_GROUPS  BIT(1)
#define MLX5E_VXLAN_TABLE_SIZE  \
    (MLX5E_VXLAN_GROUP0_SIZE + MLX5E_VXLAN_GROUP1_SIZE)

static int
mlx5e_create_vxlan_groups_sub(struct mlx5e_flow_table *ft, u32 *in,
                                      int inlen)
{
        int err;
        int ix = 0;
        u8 *mc = MLX5_ADDR_OF(create_flow_group_in, in, match_criteria);

        memset(in, 0, inlen);
        MLX5_SET_CFG(in, match_criteria_enable, MLX5_MATCH_OUTER_HEADERS);
        MLX5_SET_TO_ONES(fte_match_param, mc, outer_headers.ethertype);
        MLX5_SET_TO_ONES(fte_match_param, mc, outer_headers.ip_protocol);
        MLX5_SET_TO_ONES(fte_match_param, mc, outer_headers.udp_dport);
        MLX5_SET_CFG(in, start_flow_index, ix);
        ix += MLX5E_VXLAN_GROUP0_SIZE;
        MLX5_SET_CFG(in, end_flow_index, ix - 1);
        ft->g[ft->num_groups] = mlx5_create_flow_group(ft->t, in);
        if (IS_ERR(ft->g[ft->num_groups]))
                goto err_destory_groups;
        ft->num_groups++;

        memset(in, 0, inlen);
        MLX5_SET_CFG(in, start_flow_index, ix);
        ix += MLX5E_VXLAN_GROUP1_SIZE;
        MLX5_SET_CFG(in, end_flow_index, ix - 1);
        ft->g[ft->num_groups] = mlx5_create_flow_group(ft->t, in);
        if (IS_ERR(ft->g[ft->num_groups]))
                goto err_destory_groups;
        ft->num_groups++;

        return (0);

err_destory_groups:
        err = PTR_ERR(ft->g[ft->num_groups]);
        ft->g[ft->num_groups] = NULL;
        mlx5e_destroy_groups(ft);

        return (err);
}

static int
mlx5e_create_vxlan_groups(struct mlx5e_flow_table *ft)
{
        u32 *in;
        int inlen = MLX5_ST_SZ_BYTES(create_flow_group_in);
        int err;

        in = mlx5_vzalloc(inlen);
        if (!in)
                return (-ENOMEM);

        err = mlx5e_create_vxlan_groups_sub(ft, in, inlen);

        kvfree(in);
        return (err);
}

static int
mlx5e_create_vxlan_flow_table(struct mlx5e_priv *priv)
{
        struct mlx5e_flow_table *ft = &priv->fts.vxlan;
        struct mlx5_flow_table_attr ft_attr = {};
        int err;

        ft->num_groups = 0;
        ft_attr.max_fte = MLX5E_VXLAN_TABLE_SIZE;
        ft_attr.level = (priv->ipsec) ? 10 : 1;
        ft->t = mlx5_create_flow_table(priv->fts.ns, &ft_attr);

        if (IS_ERR(ft->t)) {
                err = PTR_ERR(ft->t);
                ft->t = NULL;
                return (err);
        }
        ft->g = kcalloc(MLX5E_NUM_VXLAN_GROUPS, sizeof(*ft->g), GFP_KERNEL);
        if (!ft->g) {
                err = -ENOMEM;
                goto err_destroy_vxlan_flow_table;
        }

        err = mlx5e_create_vxlan_groups(ft);
        if (err)
                goto err_free_g;

        TAILQ_INIT(&priv->vxlan.head);
        return (0);

err_free_g:
        kfree(ft->g);

err_destroy_vxlan_flow_table:
        mlx5_destroy_flow_table(ft->t);
        ft->t = NULL;

        return (err);
}

#define MLX5E_NUM_INNER_RSS_GROUPS      3
#define MLX5E_INNER_RSS_GROUP0_SIZE     BIT(3)
#define MLX5E_INNER_RSS_GROUP1_SIZE     BIT(1)
#define MLX5E_INNER_RSS_GROUP2_SIZE     BIT(0)
#define MLX5E_INNER_RSS_TABLE_SIZE      (MLX5E_INNER_RSS_GROUP0_SIZE +\
                                         MLX5E_INNER_RSS_GROUP1_SIZE +\
                                         MLX5E_INNER_RSS_GROUP2_SIZE +\
                                         0)

static int
mlx5e_create_inner_rss_groups_sub(struct mlx5e_flow_table *ft, u32 *in,
                                           int inlen)
{
        u8 *mc = MLX5_ADDR_OF(create_flow_group_in, in, match_criteria);
        int err;
        int ix = 0;

        memset(in, 0, inlen);
        MLX5_SET_CFG(in, match_criteria_enable, MLX5_MATCH_INNER_HEADERS);
        MLX5_SET_TO_ONES(fte_match_param, mc, inner_headers.ethertype);
        MLX5_SET_TO_ONES(fte_match_param, mc, inner_headers.ip_protocol);
        MLX5_SET_CFG(in, start_flow_index, ix);
        ix += MLX5E_INNER_RSS_GROUP0_SIZE;
        MLX5_SET_CFG(in, end_flow_index, ix - 1);
        ft->g[ft->num_groups] = mlx5_create_flow_group(ft->t, in);
        if (IS_ERR(ft->g[ft->num_groups]))
                goto err_destory_groups;
        ft->num_groups++;

        memset(in, 0, inlen);
        MLX5_SET_CFG(in, match_criteria_enable, MLX5_MATCH_INNER_HEADERS);
        MLX5_SET_TO_ONES(fte_match_param, mc, inner_headers.ethertype);
        MLX5_SET_CFG(in, start_flow_index, ix);
        ix += MLX5E_INNER_RSS_GROUP1_SIZE;
        MLX5_SET_CFG(in, end_flow_index, ix - 1);
        ft->g[ft->num_groups] = mlx5_create_flow_group(ft->t, in);
        if (IS_ERR(ft->g[ft->num_groups]))
                goto err_destory_groups;
        ft->num_groups++;

        memset(in, 0, inlen);
        MLX5_SET_CFG(in, start_flow_index, ix);
        ix += MLX5E_INNER_RSS_GROUP2_SIZE;
        MLX5_SET_CFG(in, end_flow_index, ix - 1);
        ft->g[ft->num_groups] = mlx5_create_flow_group(ft->t, in);
        if (IS_ERR(ft->g[ft->num_groups]))
                goto err_destory_groups;
        ft->num_groups++;

        return (0);

err_destory_groups:
        err = PTR_ERR(ft->g[ft->num_groups]);
        ft->g[ft->num_groups] = NULL;
        mlx5e_destroy_groups(ft);

        return (err);
}

static int
mlx5e_create_inner_rss_groups(struct mlx5e_flow_table *ft)
{
        u32 *in;
        int inlen = MLX5_ST_SZ_BYTES(create_flow_group_in);
        int err;

        in = mlx5_vzalloc(inlen);
        if (!in)
                return (-ENOMEM);

        err = mlx5e_create_inner_rss_groups_sub(ft, in, inlen);

        kvfree(in);
        return (err);
}

static int
mlx5e_create_inner_rss_flow_table(struct mlx5e_priv *priv)
{
        struct mlx5e_flow_table *ft = &priv->fts.inner_rss;
        struct mlx5_flow_table_attr ft_attr = {};
        int err;

        ft->num_groups = 0;
        ft_attr.max_fte = MLX5E_INNER_RSS_TABLE_SIZE;
        ft_attr.level = (priv->ipsec) ? 11 : 3;
        ft->t = mlx5_create_flow_table(priv->fts.ns, &ft_attr);

        if (IS_ERR(ft->t)) {
                err = PTR_ERR(ft->t);
                ft->t = NULL;
                return (err);
        }
        ft->g = kcalloc(MLX5E_NUM_INNER_RSS_GROUPS, sizeof(*ft->g),
                        GFP_KERNEL);
        if (!ft->g) {
                err = -ENOMEM;
                goto err_destroy_inner_rss_flow_table;
        }

        err = mlx5e_create_inner_rss_groups(ft);
        if (err)
                goto err_free_g;

        return (0);

err_free_g:
        kfree(ft->g);

err_destroy_inner_rss_flow_table:
        mlx5_destroy_flow_table(ft->t);
        ft->t = NULL;

        return (err);
}

static void mlx5e_destroy_inner_rss_flow_table(struct mlx5e_priv *priv)
{
        mlx5e_destroy_flow_table(&priv->fts.inner_rss);
}

static void
mlx5e_destroy_vxlan_flow_table(struct mlx5e_priv *priv)
{
        mlx5e_destroy_flow_table(&priv->fts.vxlan);
}

int
mlx5e_open_flow_tables(struct mlx5e_priv *priv)
{
        int err;

        /* setup namespace pointer */
        priv->fts.ns = mlx5_get_flow_namespace(
            priv->mdev, MLX5_FLOW_NAMESPACE_KERNEL);

        err = mlx5e_accel_ipsec_fs_rx_tables_create(priv);
        if (err)
                return err;

        err = mlx5e_create_vlan_flow_table(priv);
        if (err)
                goto err_destroy_ipsec_flow_table;

        err = mlx5e_create_vxlan_flow_table(priv);
        if (err)
                goto err_destroy_vlan_flow_table;

        err = mlx5e_create_main_flow_table(priv, true);
        if (err)
                goto err_destroy_vxlan_flow_table;

        err = mlx5e_create_inner_rss_flow_table(priv);
        if (err)
                goto err_destroy_main_flow_table_true;

        err = mlx5e_create_main_flow_table(priv, false);
        if (err)
                goto err_destroy_inner_rss_flow_table;

        err = mlx5e_add_vxlan_catchall_rule(priv);
        if (err)
                goto err_destroy_main_flow_table_false;

        err = mlx5e_accel_ipsec_fs_rx_catchall_rules(priv);
        if (err)
                goto err_destroy_vxlan_catchall_rule;

        err = mlx5e_accel_fs_tcp_create(priv);
        if (err)
                goto err_destroy_ipsec_catchall_rules;

        return (0);

err_destroy_ipsec_catchall_rules:
        mlx5e_accel_ipsec_fs_rx_catchall_rules_destroy(priv);
err_destroy_vxlan_catchall_rule:
        mlx5e_del_vxlan_catchall_rule(priv);
err_destroy_main_flow_table_false:
        mlx5e_destroy_main_flow_table(priv);
err_destroy_inner_rss_flow_table:
        mlx5e_destroy_inner_rss_flow_table(priv);
err_destroy_main_flow_table_true:
        mlx5e_destroy_main_vxlan_flow_table(priv);
err_destroy_vxlan_flow_table:
        mlx5e_destroy_vxlan_flow_table(priv);
err_destroy_vlan_flow_table:
        mlx5e_destroy_vlan_flow_table(priv);
err_destroy_ipsec_flow_table:
        mlx5e_accel_ipsec_fs_rx_tables_destroy(priv);

        return (err);
}

void
mlx5e_close_flow_tables(struct mlx5e_priv *priv)
{
        mlx5e_accel_fs_tcp_destroy(priv);
        mlx5e_accel_ipsec_fs_rx_catchall_rules_destroy(priv);
        mlx5e_del_vxlan_catchall_rule(priv);
        mlx5e_destroy_main_flow_table(priv);
        mlx5e_destroy_inner_rss_flow_table(priv);
        mlx5e_destroy_main_vxlan_flow_table(priv);
        mlx5e_destroy_vxlan_flow_table(priv);
        mlx5e_destroy_vlan_flow_table(priv);
        mlx5e_accel_ipsec_fs_rx_tables_destroy(priv);
}

int
mlx5e_open_flow_rules(struct mlx5e_priv *priv)
{
        int err;

        err = mlx5e_add_all_vlan_rules(priv);
        if (err)
                return (err);

        err = mlx5e_add_main_vxlan_rules(priv);
        if (err)
                goto err_del_all_vlan_rules;

        err = mlx5e_add_all_vxlan_rules(priv);
        if (err)
                goto err_del_main_vxlan_rules;

        mlx5e_set_rx_mode_core(priv, true);

        set_bit(MLX5E_STATE_FLOW_RULES_READY, &priv->state);

        return (0);

err_del_main_vxlan_rules:
        mlx5e_del_main_vxlan_rules(priv);

err_del_all_vlan_rules:
        mlx5e_del_all_vlan_rules(priv);

        return (err);
}

void
mlx5e_close_flow_rules(struct mlx5e_priv *priv)
{
        clear_bit(MLX5E_STATE_FLOW_RULES_READY, &priv->state);

        mlx5e_set_rx_mode_core(priv, false);
        mlx5e_del_all_vxlan_rules(priv);
        mlx5e_del_main_vxlan_rules(priv);
        mlx5e_del_all_vlan_rules(priv);
}