2018-08-09 16:59:11 +08:00
|
|
|
// SPDX-License-Identifier: BSD-3-Clause OR GPL-2.0
|
|
|
|
/* Copyright (c) 2016-2018 Mellanox Technologies. All rights reserved */
|
2016-07-02 17:00:15 +08:00
|
|
|
|
|
|
|
#include <linux/kernel.h>
|
|
|
|
#include <linux/types.h>
|
2016-07-04 14:23:04 +08:00
|
|
|
#include <linux/rhashtable.h>
|
|
|
|
#include <linux/bitops.h>
|
|
|
|
#include <linux/in6.h>
|
2016-07-05 17:27:43 +08:00
|
|
|
#include <linux/notifier.h>
|
2017-02-08 21:36:49 +08:00
|
|
|
#include <linux/inetdevice.h>
|
2017-03-16 16:08:17 +08:00
|
|
|
#include <linux/netdevice.h>
|
2017-05-24 03:56:30 +08:00
|
|
|
#include <linux/if_bridge.h>
|
2017-07-24 15:56:00 +08:00
|
|
|
#include <linux/socket.h>
|
2017-08-03 19:28:28 +08:00
|
|
|
#include <linux/route.h>
|
2017-10-23 05:11:48 +08:00
|
|
|
#include <linux/gcd.h>
|
2018-07-14 16:39:52 +08:00
|
|
|
#include <linux/if_macvlan.h>
|
mlxsw: spectrum_router: Do not destroy RIFs based on FID's reference count
Currently, when a RIF is constructed on top of a FID, the RIF increments
the FID's reference count and the RIF is destroyed when the FID's
reference count drops to 1. This effectively means that when no local
ports are member in the FID, the FID is destroyed regardless if the
router port is a member in the FID or not.
The above can lead to the unexpected behavior in which routes using a
VLAN interface as their nexthop device are no longer offloaded after the
last local port leaves the corresponding VLAN (FID).
Example:
# ip -4 route show dev br0.10
192.0.2.0/24 proto kernel scope link src 192.0.2.1 offload
# bridge vlan del vid 10 dev swp3
# ip -4 route show dev br0.10
192.0.2.0/24 proto kernel scope link src 192.0.2.1
After the patch, the route is offloaded before and after the VLAN is
removed from local port 'swp3', as the RIF corresponding to 'br0.10'
continues to exist.
In order to remove RIFs' reliance on the underlying FID's reference
count, we need to add a reference count to sub-port RIFs, which are RIFs
that correspond to physical ports and their uppers (e.g., LAG devices).
In this case, each {Port, VID} ('struct mlxsw_sp_port_vlan') needs to
hold a reference on the RIF. For example:
bond0.10
|
bond0
|
+-------+
| |
swp1 swp2
Both {Port 1, VID 10} and {Port 2, VID 10} will hold a reference on the
RIF corresponding to 'bond0.10'. When the last reference is dropped, the
RIF will be destroyed.
Signed-off-by: Ido Schimmel <idosch@mellanox.com>
Reviewed-by: Petr Machata <petrm@mellanox.com>
Signed-off-by: David S. Miller <davem@davemloft.net>
2018-12-19 14:08:38 +08:00
|
|
|
#include <linux/refcount.h>
|
2019-04-21 15:18:34 +08:00
|
|
|
#include <linux/jhash.h>
|
2019-10-03 17:49:32 +08:00
|
|
|
#include <linux/net_namespace.h>
|
2020-02-22 01:54:09 +08:00
|
|
|
#include <linux/mutex.h>
|
2016-07-05 17:27:43 +08:00
|
|
|
#include <net/netevent.h>
|
2016-07-05 17:27:39 +08:00
|
|
|
#include <net/neighbour.h>
|
|
|
|
#include <net/arp.h>
|
2016-09-26 18:52:31 +08:00
|
|
|
#include <net/ip_fib.h>
|
2017-08-03 19:28:27 +08:00
|
|
|
#include <net/ip6_fib.h>
|
2019-06-04 11:19:49 +08:00
|
|
|
#include <net/nexthop.h>
|
2017-03-16 16:08:14 +08:00
|
|
|
#include <net/fib_rules.h>
|
2017-09-03 05:49:19 +08:00
|
|
|
#include <net/ip_tunnels.h>
|
2017-03-16 16:08:16 +08:00
|
|
|
#include <net/l3mdev.h>
|
2017-07-18 16:10:13 +08:00
|
|
|
#include <net/addrconf.h>
|
2017-07-18 16:10:15 +08:00
|
|
|
#include <net/ndisc.h>
|
|
|
|
#include <net/ipv6.h>
|
2017-08-03 19:28:11 +08:00
|
|
|
#include <net/fib_notifier.h>
|
2018-07-14 16:39:52 +08:00
|
|
|
#include <net/switchdev.h>
|
2016-07-02 17:00:15 +08:00
|
|
|
|
|
|
|
#include "spectrum.h"
|
|
|
|
#include "core.h"
|
|
|
|
#include "reg.h"
|
2017-03-28 23:24:15 +08:00
|
|
|
#include "spectrum_cnt.h"
|
|
|
|
#include "spectrum_dpipe.h"
|
2017-09-03 05:49:17 +08:00
|
|
|
#include "spectrum_ipip.h"
|
2017-09-27 14:23:20 +08:00
|
|
|
#include "spectrum_mr.h"
|
|
|
|
#include "spectrum_mr_tcam.h"
|
2017-03-28 23:24:15 +08:00
|
|
|
#include "spectrum_router.h"
|
2018-02-27 21:53:46 +08:00
|
|
|
#include "spectrum_span.h"
|
2016-07-02 17:00:15 +08:00
|
|
|
|
2018-01-22 16:17:42 +08:00
|
|
|
struct mlxsw_sp_fib;
|
2017-05-17 01:38:25 +08:00
|
|
|
struct mlxsw_sp_vr;
|
|
|
|
struct mlxsw_sp_lpm_tree;
|
2017-05-26 14:37:40 +08:00
|
|
|
struct mlxsw_sp_rif_ops;
|
2017-05-17 01:38:25 +08:00
|
|
|
|
2017-03-10 15:53:39 +08:00
|
|
|
struct mlxsw_sp_rif {
|
|
|
|
struct list_head nexthop_list;
|
|
|
|
struct list_head neigh_list;
|
2019-01-20 14:50:49 +08:00
|
|
|
struct net_device *dev; /* NULL for underlay RIF */
|
2017-05-26 14:37:39 +08:00
|
|
|
struct mlxsw_sp_fid *fid;
|
2017-03-10 15:53:39 +08:00
|
|
|
unsigned char addr[ETH_ALEN];
|
|
|
|
int mtu;
|
2017-03-17 16:38:00 +08:00
|
|
|
u16 rif_index;
|
2017-03-10 15:53:42 +08:00
|
|
|
u16 vr_id;
|
2017-05-26 14:37:40 +08:00
|
|
|
const struct mlxsw_sp_rif_ops *ops;
|
|
|
|
struct mlxsw_sp *mlxsw_sp;
|
|
|
|
|
2017-03-28 23:24:15 +08:00
|
|
|
unsigned int counter_ingress;
|
|
|
|
bool counter_ingress_valid;
|
|
|
|
unsigned int counter_egress;
|
|
|
|
bool counter_egress_valid;
|
2017-03-10 15:53:39 +08:00
|
|
|
};
|
|
|
|
|
2017-05-26 14:37:40 +08:00
|
|
|
struct mlxsw_sp_rif_params {
|
|
|
|
struct net_device *dev;
|
|
|
|
union {
|
|
|
|
u16 system_port;
|
|
|
|
u16 lag_id;
|
|
|
|
};
|
|
|
|
u16 vid;
|
|
|
|
bool lag;
|
|
|
|
};
|
|
|
|
|
2017-05-26 14:37:34 +08:00
|
|
|
struct mlxsw_sp_rif_subport {
|
|
|
|
struct mlxsw_sp_rif common;
|
mlxsw: spectrum_router: Do not destroy RIFs based on FID's reference count
Currently, when a RIF is constructed on top of a FID, the RIF increments
the FID's reference count and the RIF is destroyed when the FID's
reference count drops to 1. This effectively means that when no local
ports are member in the FID, the FID is destroyed regardless if the
router port is a member in the FID or not.
The above can lead to the unexpected behavior in which routes using a
VLAN interface as their nexthop device are no longer offloaded after the
last local port leaves the corresponding VLAN (FID).
Example:
# ip -4 route show dev br0.10
192.0.2.0/24 proto kernel scope link src 192.0.2.1 offload
# bridge vlan del vid 10 dev swp3
# ip -4 route show dev br0.10
192.0.2.0/24 proto kernel scope link src 192.0.2.1
After the patch, the route is offloaded before and after the VLAN is
removed from local port 'swp3', as the RIF corresponding to 'br0.10'
continues to exists.
In order to remove RIFs' reliance on the underlying FID's reference
count, we need to add a reference count to sub-port RIFs, which are RIFs
that correspond to physical ports and their uppers (e.g., LAG devices).
In this case, each {Port, VID} ('struct mlxsw_sp_port_vlan') needs to
hold a reference on the RIF. For example:
bond0.10
|
bond0
|
+-------+
| |
swp1 swp2
Both {Port 1, VID 10} and {Port 2, VID 10} will hold a reference on the
RIF corresponding to 'bond0.10'. When the last reference is dropped, the
RIF will be destroyed.
Signed-off-by: Ido Schimmel <idosch@mellanox.com>
Reviewed-by: Petr Machata <petrm@mellanox.com>
Signed-off-by: David S. Miller <davem@davemloft.net>
2018-12-19 14:08:38 +08:00
|
|
|
refcount_t ref_count;
|
2017-05-26 14:37:34 +08:00
|
|
|
union {
|
|
|
|
u16 system_port;
|
|
|
|
u16 lag_id;
|
|
|
|
};
|
|
|
|
u16 vid;
|
|
|
|
bool lag;
|
|
|
|
};
|
|
|
|
|
2017-09-03 05:49:19 +08:00
|
|
|
struct mlxsw_sp_rif_ipip_lb {
|
|
|
|
struct mlxsw_sp_rif common;
|
|
|
|
struct mlxsw_sp_rif_ipip_lb_config lb_config;
|
|
|
|
u16 ul_vr_id; /* Reserved for Spectrum-2. */
|
2019-01-20 14:50:47 +08:00
|
|
|
u16 ul_rif_id; /* Reserved for Spectrum. */
|
2017-09-03 05:49:19 +08:00
|
|
|
};
|
|
|
|
|
|
|
|
struct mlxsw_sp_rif_params_ipip_lb {
|
|
|
|
struct mlxsw_sp_rif_params common;
|
|
|
|
struct mlxsw_sp_rif_ipip_lb_config lb_config;
|
|
|
|
};
|
|
|
|
|
2017-05-26 14:37:40 +08:00
|
|
|
struct mlxsw_sp_rif_ops {
|
|
|
|
enum mlxsw_sp_rif_type type;
|
|
|
|
size_t rif_size;
|
|
|
|
|
|
|
|
void (*setup)(struct mlxsw_sp_rif *rif,
|
|
|
|
const struct mlxsw_sp_rif_params *params);
|
|
|
|
int (*configure)(struct mlxsw_sp_rif *rif);
|
|
|
|
void (*deconfigure)(struct mlxsw_sp_rif *rif);
|
2018-06-25 15:48:13 +08:00
|
|
|
struct mlxsw_sp_fid * (*fid_get)(struct mlxsw_sp_rif *rif,
|
|
|
|
struct netlink_ext_ack *extack);
|
2018-07-14 16:39:52 +08:00
|
|
|
void (*fdb_del)(struct mlxsw_sp_rif *rif, const char *mac);
|
2017-05-26 14:37:40 +08:00
|
|
|
};
|
|
|
|
|
2020-02-20 15:07:59 +08:00
|
|
|
static struct mlxsw_sp_rif *
|
|
|
|
mlxsw_sp_rif_find_by_dev(const struct mlxsw_sp *mlxsw_sp,
|
|
|
|
const struct net_device *dev);
|
mlxsw: spectrum_router: Do not destroy RIFs based on FID's reference count
Currently, when a RIF is constructed on top of a FID, the RIF increments
the FID's reference count and the RIF is destroyed when the FID's
reference count drops to 1. This effectively means that when no local
ports are member in the FID, the FID is destroyed regardless if the
router port is a member in the FID or not.
The above can lead to the unexpected behavior in which routes using a
VLAN interface as their nexthop device are no longer offloaded after the
last local port leaves the corresponding VLAN (FID).
Example:
# ip -4 route show dev br0.10
192.0.2.0/24 proto kernel scope link src 192.0.2.1 offload
# bridge vlan del vid 10 dev swp3
# ip -4 route show dev br0.10
192.0.2.0/24 proto kernel scope link src 192.0.2.1
After the patch, the route is offloaded before and after the VLAN is
removed from local port 'swp3', as the RIF corresponding to 'br0.10'
continues to exist.
In order to remove RIFs' reliance on the underlying FID's reference
count, we need to add a reference count to sub-port RIFs, which are RIFs
that correspond to physical ports and their uppers (e.g., LAG devices).
In this case, each {Port, VID} ('struct mlxsw_sp_port_vlan') needs to
hold a reference on the RIF. For example:
bond0.10
|
bond0
|
+-------+
| |
swp1 swp2
Both {Port 1, VID 10} and {Port 2, VID 10} will hold a reference on the
RIF corresponding to 'bond0.10'. When the last reference is dropped, the
RIF will be destroyed.
Signed-off-by: Ido Schimmel <idosch@mellanox.com>
Reviewed-by: Petr Machata <petrm@mellanox.com>
Signed-off-by: David S. Miller <davem@davemloft.net>
2018-12-19 14:08:38 +08:00
|
|
|
static void mlxsw_sp_rif_destroy(struct mlxsw_sp_rif *rif);
|
2018-01-22 16:17:42 +08:00
|
|
|
static void mlxsw_sp_lpm_tree_hold(struct mlxsw_sp_lpm_tree *lpm_tree);
|
|
|
|
static void mlxsw_sp_lpm_tree_put(struct mlxsw_sp *mlxsw_sp,
|
|
|
|
struct mlxsw_sp_lpm_tree *lpm_tree);
|
|
|
|
static int mlxsw_sp_vr_lpm_tree_bind(struct mlxsw_sp *mlxsw_sp,
|
|
|
|
const struct mlxsw_sp_fib *fib,
|
|
|
|
u8 tree_id);
|
|
|
|
static int mlxsw_sp_vr_lpm_tree_unbind(struct mlxsw_sp *mlxsw_sp,
|
|
|
|
const struct mlxsw_sp_fib *fib);
|
|
|
|
|
2017-03-28 23:24:15 +08:00
|
|
|
static unsigned int *
|
|
|
|
mlxsw_sp_rif_p_counter_get(struct mlxsw_sp_rif *rif,
|
|
|
|
enum mlxsw_sp_rif_counter_dir dir)
|
|
|
|
{
|
|
|
|
switch (dir) {
|
|
|
|
case MLXSW_SP_RIF_COUNTER_EGRESS:
|
|
|
|
return &rif->counter_egress;
|
|
|
|
case MLXSW_SP_RIF_COUNTER_INGRESS:
|
|
|
|
return &rif->counter_ingress;
|
|
|
|
}
|
|
|
|
return NULL;
|
|
|
|
}
|
|
|
|
|
|
|
|
static bool
|
|
|
|
mlxsw_sp_rif_counter_valid_get(struct mlxsw_sp_rif *rif,
|
|
|
|
enum mlxsw_sp_rif_counter_dir dir)
|
|
|
|
{
|
|
|
|
switch (dir) {
|
|
|
|
case MLXSW_SP_RIF_COUNTER_EGRESS:
|
|
|
|
return rif->counter_egress_valid;
|
|
|
|
case MLXSW_SP_RIF_COUNTER_INGRESS:
|
|
|
|
return rif->counter_ingress_valid;
|
|
|
|
}
|
|
|
|
return false;
|
|
|
|
}
|
|
|
|
|
|
|
|
static void
|
|
|
|
mlxsw_sp_rif_counter_valid_set(struct mlxsw_sp_rif *rif,
|
|
|
|
enum mlxsw_sp_rif_counter_dir dir,
|
|
|
|
bool valid)
|
|
|
|
{
|
|
|
|
switch (dir) {
|
|
|
|
case MLXSW_SP_RIF_COUNTER_EGRESS:
|
|
|
|
rif->counter_egress_valid = valid;
|
|
|
|
break;
|
|
|
|
case MLXSW_SP_RIF_COUNTER_INGRESS:
|
|
|
|
rif->counter_ingress_valid = valid;
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
/* Enable or disable counter @counter_index on RIF @rif_index in direction
 * @dir by updating the RITR register.
 *
 * Returns 0 on success or the error returned by the register access.
 */
static int mlxsw_sp_rif_counter_edit(struct mlxsw_sp *mlxsw_sp, u16 rif_index,
				     unsigned int counter_index, bool enable,
				     enum mlxsw_sp_rif_counter_dir dir)
{
	bool is_egress = dir == MLXSW_SP_RIF_COUNTER_EGRESS;
	char ritr_pl[MLXSW_REG_RITR_LEN];
	int rc;

	/* Query the register for this RIF first; the counter fields are then
	 * packed into the same payload before it is written back.
	 */
	mlxsw_reg_ritr_rif_pack(ritr_pl, rif_index);
	rc = mlxsw_reg_query(mlxsw_sp->core, MLXSW_REG(ritr), ritr_pl);
	if (rc)
		return rc;

	mlxsw_reg_ritr_counter_pack(ritr_pl, counter_index, enable, is_egress);

	return mlxsw_reg_write(mlxsw_sp->core, MLXSW_REG(ritr), ritr_pl);
}
|
|
|
|
|
|
|
|
/* Read the good unicast packets count of the RIF's counter for @dir.
 *
 * On success 0 is returned and the value is stored in @cnt. -EINVAL is
 * returned when the RIF has no valid counter for @dir or @dir is unknown;
 * a failed register query returns its own error. @cnt is not written on
 * failure.
 */
int mlxsw_sp_rif_counter_value_get(struct mlxsw_sp *mlxsw_sp,
				   struct mlxsw_sp_rif *rif,
				   enum mlxsw_sp_rif_counter_dir dir, u64 *cnt)
{
	char ricnt_pl[MLXSW_REG_RICNT_LEN];
	unsigned int *p_index;
	int rc;

	if (!mlxsw_sp_rif_counter_valid_get(rif, dir))
		return -EINVAL;

	p_index = mlxsw_sp_rif_p_counter_get(rif, dir);
	if (!p_index)
		return -EINVAL;

	/* NOP opcode: the query does not request a clear. */
	mlxsw_reg_ricnt_pack(ricnt_pl, *p_index, MLXSW_REG_RICNT_OPCODE_NOP);
	rc = mlxsw_reg_query(mlxsw_sp->core, MLXSW_REG(ricnt), ricnt_pl);
	if (rc)
		return rc;

	*cnt = mlxsw_reg_ricnt_good_unicast_packets_get(ricnt_pl);

	return 0;
}
|
|
|
|
|
|
|
|
static int mlxsw_sp_rif_counter_clear(struct mlxsw_sp *mlxsw_sp,
|
|
|
|
unsigned int counter_index)
|
|
|
|
{
|
|
|
|
char ricnt_pl[MLXSW_REG_RICNT_LEN];
|
|
|
|
|
|
|
|
mlxsw_reg_ricnt_pack(ricnt_pl, counter_index,
|
|
|
|
MLXSW_REG_RICNT_OPCODE_CLEAR);
|
|
|
|
return mlxsw_reg_write(mlxsw_sp->core, MLXSW_REG(ricnt), ricnt_pl);
|
|
|
|
}
|
|
|
|
|
|
|
|
int mlxsw_sp_rif_counter_alloc(struct mlxsw_sp *mlxsw_sp,
|
|
|
|
struct mlxsw_sp_rif *rif,
|
|
|
|
enum mlxsw_sp_rif_counter_dir dir)
|
|
|
|
{
|
|
|
|
unsigned int *p_counter_index;
|
|
|
|
int err;
|
|
|
|
|
|
|
|
p_counter_index = mlxsw_sp_rif_p_counter_get(rif, dir);
|
|
|
|
if (!p_counter_index)
|
|
|
|
return -EINVAL;
|
|
|
|
err = mlxsw_sp_counter_alloc(mlxsw_sp, MLXSW_SP_COUNTER_SUB_POOL_RIF,
|
|
|
|
p_counter_index);
|
|
|
|
if (err)
|
|
|
|
return err;
|
|
|
|
|
|
|
|
err = mlxsw_sp_rif_counter_clear(mlxsw_sp, *p_counter_index);
|
|
|
|
if (err)
|
|
|
|
goto err_counter_clear;
|
|
|
|
|
|
|
|
err = mlxsw_sp_rif_counter_edit(mlxsw_sp, rif->rif_index,
|
|
|
|
*p_counter_index, true, dir);
|
|
|
|
if (err)
|
|
|
|
goto err_counter_edit;
|
|
|
|
mlxsw_sp_rif_counter_valid_set(rif, dir, true);
|
|
|
|
return 0;
|
|
|
|
|
|
|
|
err_counter_edit:
|
|
|
|
err_counter_clear:
|
|
|
|
mlxsw_sp_counter_free(mlxsw_sp, MLXSW_SP_COUNTER_SUB_POOL_RIF,
|
|
|
|
*p_counter_index);
|
|
|
|
return err;
|
|
|
|
}
|
|
|
|
|
|
|
|
void mlxsw_sp_rif_counter_free(struct mlxsw_sp *mlxsw_sp,
|
|
|
|
struct mlxsw_sp_rif *rif,
|
|
|
|
enum mlxsw_sp_rif_counter_dir dir)
|
|
|
|
{
|
|
|
|
unsigned int *p_counter_index;
|
|
|
|
|
2017-05-18 15:18:53 +08:00
|
|
|
if (!mlxsw_sp_rif_counter_valid_get(rif, dir))
|
|
|
|
return;
|
|
|
|
|
2017-03-28 23:24:15 +08:00
|
|
|
p_counter_index = mlxsw_sp_rif_p_counter_get(rif, dir);
|
|
|
|
if (WARN_ON(!p_counter_index))
|
|
|
|
return;
|
|
|
|
mlxsw_sp_rif_counter_edit(mlxsw_sp, rif->rif_index,
|
|
|
|
*p_counter_index, false, dir);
|
|
|
|
mlxsw_sp_counter_free(mlxsw_sp, MLXSW_SP_COUNTER_SUB_POOL_RIF,
|
|
|
|
*p_counter_index);
|
|
|
|
mlxsw_sp_rif_counter_valid_set(rif, dir, false);
|
|
|
|
}
|
|
|
|
|
2017-05-26 14:37:40 +08:00
|
|
|
static void mlxsw_sp_rif_counters_alloc(struct mlxsw_sp_rif *rif)
|
|
|
|
{
|
|
|
|
struct mlxsw_sp *mlxsw_sp = rif->mlxsw_sp;
|
|
|
|
struct devlink *devlink;
|
|
|
|
|
|
|
|
devlink = priv_to_devlink(mlxsw_sp->core);
|
|
|
|
if (!devlink_dpipe_table_counter_enabled(devlink,
|
|
|
|
MLXSW_SP_DPIPE_TABLE_NAME_ERIF))
|
|
|
|
return;
|
|
|
|
mlxsw_sp_rif_counter_alloc(mlxsw_sp, rif, MLXSW_SP_RIF_COUNTER_EGRESS);
|
|
|
|
}
|
|
|
|
|
|
|
|
static void mlxsw_sp_rif_counters_free(struct mlxsw_sp_rif *rif)
|
|
|
|
{
|
|
|
|
struct mlxsw_sp *mlxsw_sp = rif->mlxsw_sp;
|
|
|
|
|
|
|
|
mlxsw_sp_rif_counter_free(mlxsw_sp, rif, MLXSW_SP_RIF_COUNTER_EGRESS);
|
|
|
|
}
|
|
|
|
|
2017-07-18 16:10:30 +08:00
|
|
|
#define MLXSW_SP_PREFIX_COUNT (sizeof(struct in6_addr) * BITS_PER_BYTE + 1)
|
2017-05-17 01:38:25 +08:00
|
|
|
|
|
|
|
struct mlxsw_sp_prefix_usage {
|
|
|
|
DECLARE_BITMAP(b, MLXSW_SP_PREFIX_COUNT);
|
|
|
|
};
|
|
|
|
|
2016-07-04 14:23:08 +08:00
|
|
|
/* Iterate @prefix over every bit that is set in @prefix_usage. */
#define mlxsw_sp_prefix_usage_for_each(prefix, prefix_usage)		\
	for_each_set_bit(prefix, (prefix_usage)->b, MLXSW_SP_PREFIX_COUNT)
|
|
|
|
|
|
|
|
static bool
|
|
|
|
mlxsw_sp_prefix_usage_eq(struct mlxsw_sp_prefix_usage *prefix_usage1,
|
|
|
|
struct mlxsw_sp_prefix_usage *prefix_usage2)
|
|
|
|
{
|
|
|
|
return !memcmp(prefix_usage1, prefix_usage2, sizeof(*prefix_usage1));
|
|
|
|
}
|
|
|
|
|
2016-07-04 14:23:09 +08:00
|
|
|
static void
|
|
|
|
mlxsw_sp_prefix_usage_cpy(struct mlxsw_sp_prefix_usage *prefix_usage1,
|
|
|
|
struct mlxsw_sp_prefix_usage *prefix_usage2)
|
|
|
|
{
|
|
|
|
memcpy(prefix_usage1, prefix_usage2, sizeof(*prefix_usage1));
|
|
|
|
}
|
|
|
|
|
2016-07-04 14:23:04 +08:00
|
|
|
static void
|
|
|
|
mlxsw_sp_prefix_usage_set(struct mlxsw_sp_prefix_usage *prefix_usage,
|
|
|
|
unsigned char prefix_len)
|
|
|
|
{
|
|
|
|
set_bit(prefix_len, prefix_usage->b);
|
|
|
|
}
|
|
|
|
|
|
|
|
static void
|
|
|
|
mlxsw_sp_prefix_usage_clear(struct mlxsw_sp_prefix_usage *prefix_usage,
|
|
|
|
unsigned char prefix_len)
|
|
|
|
{
|
|
|
|
clear_bit(prefix_len, prefix_usage->b);
|
|
|
|
}
|
|
|
|
|
|
|
|
struct mlxsw_sp_fib_key {
|
|
|
|
unsigned char addr[sizeof(struct in6_addr)];
|
|
|
|
unsigned char prefix_len;
|
|
|
|
};
|
|
|
|
|
2016-07-04 14:23:11 +08:00
|
|
|
/* Kind of a FIB entry. */
enum mlxsw_sp_fib_entry_type {
	MLXSW_SP_FIB_ENTRY_TYPE_REMOTE,
	MLXSW_SP_FIB_ENTRY_TYPE_LOCAL,
	MLXSW_SP_FIB_ENTRY_TYPE_TRAP,
	MLXSW_SP_FIB_ENTRY_TYPE_BLACKHOLE,
	MLXSW_SP_FIB_ENTRY_TYPE_UNREACHABLE,

	/* A special case of local delivery, where a packet should be
	 * decapsulated on reception. There is no corresponding ENCAP type,
	 * because encapsulation is a type of next hop, not of FIB entry. (A
	 * REMOTE entry can have several next hops, and some of them may be
	 * encapsulating entries.)
	 */
	MLXSW_SP_FIB_ENTRY_TYPE_IPIP_DECAP,
	MLXSW_SP_FIB_ENTRY_TYPE_NVE_DECAP,
};
|
|
|
|
|
2016-07-05 17:27:50 +08:00
|
|
|
struct mlxsw_sp_nexthop_group;
|
2019-12-27 00:41:17 +08:00
|
|
|
struct mlxsw_sp_fib_entry;
|
2016-07-05 17:27:50 +08:00
|
|
|
|
mlxsw: spectrum_router: Correctly handle identical routes
In the device, routes are indexed in a routing table based on the prefix
and its length. This is in contrast to the kernel's FIB where several
FIB aliases can exist with these parameters being identical. In such
cases, the routes will be sorted by table ID (LOCAL first, then MAIN),
TOS and finally priority (metric).
During lookup, these routes will be evaluated in order. In case the
packet's TOS field is non-zero and a FIB alias with a matching TOS is
found, then it's selected. Otherwise, the lookup defaults to the route
with TOS 0 (if it exists). However, if the requested scope is narrower
than the one found, then the lookup continues.
To best reflect the kernel's datapath we should take the above into
account. Given a prefix and its length, the reflected route will always
be the first one in the FIB alias list. However, if the route has a
non-zero TOS then its action will be converted to trap instead of
forward, since we currently don't support TOS-based routing. If this
turns out to be a real issue, we can add support for that using
policy-based switching.
The route's scope can be effectively ignored as any packet being routed
by the device would've been looked-up using the widest scope (UNIVERSE).
To achieve that we need to do two changes. Firstly, we need to create
another struct (FIB node) that will hold the list of FIB entries sharing
the same prefix and length. This struct will be hashed using these two
parameters.
Secondly, we need to change the route reflection to match the above
logic, so that the first FIB entry in the list will be programmed into
the device while the rest will remain in the driver's cache in case of
subsequent changes.
Signed-off-by: Ido Schimmel <idosch@mellanox.com>
Signed-off-by: Jiri Pirko <jiri@mellanox.com>
Signed-off-by: David S. Miller <davem@davemloft.net>
2017-02-09 17:28:42 +08:00
|
|
|
struct mlxsw_sp_fib_node {
|
2019-12-27 00:41:17 +08:00
|
|
|
struct mlxsw_sp_fib_entry *fib_entry;
|
2016-09-26 18:52:31 +08:00
|
|
|
struct list_head list;
|
mlxsw: spectrum_router: Correctly handle identical routes
In the device, routes are indexed in a routing table based on the prefix
and its length. This is in contrast to the kernel's FIB where several
FIB aliases can exist with these parameters being identical. In such
cases, the routes will be sorted by table ID (LOCAL first, then MAIN),
TOS and finally priority (metric).
During lookup, these routes will be evaluated in order. In case the
packet's TOS field is non-zero and a FIB alias with a matching TOS is
found, then it's selected. Otherwise, the lookup defaults to the route
with TOS 0 (if it exists). However, if the requested scope is narrower
than the one found, then the lookup continues.
To best reflect the kernel's datapath we should take the above into
account. Given a prefix and its length, the reflected route will always
be the first one in the FIB alias list. However, if the route has a
non-zero TOS then its action will be converted to trap instead of
forward, since we currently don't support TOS-based routing. If this
turns out to be a real issue, we can add support for that using
policy-based switching.
The route's scope can be effectively ignored as any packet being routed
by the device would've been looked-up using the widest scope (UNIVERSE).
To achieve that we need to do two changes. Firstly, we need to create
another struct (FIB node) that will hold the list of FIB entries sharing
the same prefix and length. This struct will be hashed using these two
parameters.
Secondly, we need to change the route reflection to match the above
logic, so that the first FIB entry in the list will be programmed into
the device while the rest will remain in the driver's cache in case of
subsequent changes.
Signed-off-by: Ido Schimmel <idosch@mellanox.com>
Signed-off-by: Jiri Pirko <jiri@mellanox.com>
Signed-off-by: David S. Miller <davem@davemloft.net>
2017-02-09 17:28:42 +08:00
|
|
|
struct rhash_head ht_node;
|
2017-03-10 15:53:41 +08:00
|
|
|
struct mlxsw_sp_fib *fib;
|
2016-07-04 14:23:04 +08:00
|
|
|
struct mlxsw_sp_fib_key key;
|
mlxsw: spectrum_router: Correctly handle identical routes
In the device, routes are indexed in a routing table based on the prefix
and its length. This is in contrast to the kernel's FIB where several
FIB aliases can exist with these parameters being identical. In such
cases, the routes will be sorted by table ID (LOCAL first, then MAIN),
TOS and finally priority (metric).
During lookup, these routes will be evaluated in order. In case the
packet's TOS field is non-zero and a FIB alias with a matching TOS is
found, then it's selected. Otherwise, the lookup defaults to the route
with TOS 0 (if it exists). However, if the requested scope is narrower
than the one found, then the lookup continues.
To best reflect the kernel's datapath we should take the above into
account. Given a prefix and its length, the reflected route will always
be the first one in the FIB alias list. However, if the route has a
non-zero TOS then its action will be converted to trap instead of
forward, since we currently don't support TOS-based routing. If this
turns out to be a real issue, we can add support for that using
policy-based switching.
The route's scope can be effectively ignored as any packet being routed
by the device would've been looked-up using the widest scope (UNIVERSE).
To achieve that we need to do two changes. Firstly, we need to create
another struct (FIB node) that will hold the list of FIB entries sharing
the same prefix and length. This struct will be hashed using these two
parameters.
Secondly, we need to change the route reflection to match the above
logic, so that the first FIB entry in the list will be programmed into
the device while the rest will remain in the driver's cache in case of
subsequent changes.
Signed-off-by: Ido Schimmel <idosch@mellanox.com>
Signed-off-by: Jiri Pirko <jiri@mellanox.com>
Signed-off-by: David S. Miller <davem@davemloft.net>
2017-02-09 17:28:42 +08:00
|
|
|
};
|
|
|
|
|
2017-09-03 05:49:25 +08:00
|
|
|
struct mlxsw_sp_fib_entry_decap {
|
|
|
|
struct mlxsw_sp_ipip_entry *ipip_entry;
|
|
|
|
u32 tunnel_index;
|
|
|
|
};
|
|
|
|
|
mlxsw: spectrum_router: Correctly handle identical routes
In the device, routes are indexed in a routing table based on the prefix
and its length. This is in contrast to the kernel's FIB where several
FIB aliases can exist with these parameters being identical. In such
cases, the routes will be sorted by table ID (LOCAL first, then MAIN),
TOS and finally priority (metric).
During lookup, these routes will be evaluated in order. In case the
packet's TOS field is non-zero and a FIB alias with a matching TOS is
found, then it's selected. Otherwise, the lookup defaults to the route
with TOS 0 (if it exists). However, if the requested scope is narrower
than the one found, then the lookup continues.
To best reflect the kernel's datapath we should take the above into
account. Given a prefix and its length, the reflected route will always
be the first one in the FIB alias list. However, if the route has a
non-zero TOS then its action will be converted to trap instead of
forward, since we currently don't support TOS-based routing. If this
turns out to be a real issue, we can add support for that using
policy-based switching.
The route's scope can be effectively ignored as any packet being routed
by the device would've been looked-up using the widest scope (UNIVERSE).
To achieve that we need to do two changes. Firstly, we need to create
another struct (FIB node) that will hold the list of FIB entries sharing
the same prefix and length. This struct will be hashed using these two
parameters.
Secondly, we need to change the route reflection to match the above
logic, so that the first FIB entry in the list will be programmed into
the device while the rest will remain in the driver's cache in case of
subsequent changes.
Signed-off-by: Ido Schimmel <idosch@mellanox.com>
Signed-off-by: Jiri Pirko <jiri@mellanox.com>
Signed-off-by: David S. Miller <davem@davemloft.net>
2017-02-09 17:28:42 +08:00
|
|
|
struct mlxsw_sp_fib_entry {
|
|
|
|
struct mlxsw_sp_fib_node *fib_node;
|
2016-07-04 14:23:11 +08:00
|
|
|
enum mlxsw_sp_fib_entry_type type;
|
2016-07-05 17:27:50 +08:00
|
|
|
struct list_head nexthop_group_node;
|
|
|
|
struct mlxsw_sp_nexthop_group *nh_group;
|
2017-09-03 05:49:25 +08:00
|
|
|
struct mlxsw_sp_fib_entry_decap decap; /* Valid for decap entries. */
|
2016-07-04 14:23:04 +08:00
|
|
|
};
|
|
|
|
|
2017-07-18 16:10:26 +08:00
|
|
|
struct mlxsw_sp_fib4_entry {
|
|
|
|
struct mlxsw_sp_fib_entry common;
|
|
|
|
u32 tb_id;
|
|
|
|
u32 prio;
|
|
|
|
u8 tos;
|
|
|
|
u8 type;
|
|
|
|
};
|
|
|
|
|
2017-08-03 19:28:28 +08:00
|
|
|
struct mlxsw_sp_fib6_entry {
|
|
|
|
struct mlxsw_sp_fib_entry common;
|
|
|
|
struct list_head rt6_list;
|
|
|
|
unsigned int nrt6;
|
|
|
|
};
|
|
|
|
|
|
|
|
struct mlxsw_sp_rt6 {
|
|
|
|
struct list_head list;
|
2018-04-18 08:33:26 +08:00
|
|
|
struct fib6_info *rt;
|
2017-08-03 19:28:28 +08:00
|
|
|
};
|
|
|
|
|
2017-05-17 01:38:25 +08:00
|
|
|
struct mlxsw_sp_lpm_tree {
|
|
|
|
u8 id; /* tree ID */
|
|
|
|
unsigned int ref_count;
|
|
|
|
enum mlxsw_sp_l3proto proto;
|
2018-01-22 16:17:42 +08:00
|
|
|
unsigned long prefix_ref_count[MLXSW_SP_PREFIX_COUNT];
|
2017-05-17 01:38:25 +08:00
|
|
|
struct mlxsw_sp_prefix_usage prefix_usage;
|
|
|
|
};
|
|
|
|
|
2016-07-04 14:23:04 +08:00
|
|
|
struct mlxsw_sp_fib {
|
|
|
|
struct rhashtable ht;
|
mlxsw: spectrum_router: Correctly handle identical routes
In the device, routes are indexed in a routing table based on the prefix
and its length. This is in contrast to the kernel's FIB where several
FIB aliases can exist with these parameters being identical. In such
cases, the routes will be sorted by table ID (LOCAL first, then MAIN),
TOS and finally priority (metric).
During lookup, these routes will be evaluated in order. In case the
packet's TOS field is non-zero and a FIB alias with a matching TOS is
found, then it's selected. Otherwise, the lookup defaults to the route
with TOS 0 (if it exists). However, if the requested scope is narrower
than the one found, then the lookup continues.
To best reflect the kernel's datapath we should take the above into
account. Given a prefix and its length, the reflected route will always
be the first one in the FIB alias list. However, if the route has a
non-zero TOS then its action will be converted to trap instead of
forward, since we currently don't support TOS-based routing. If this
turns out to be a real issue, we can add support for that using
policy-based switching.
The route's scope can be effectively ignored as any packet being routed
by the device would've been looked-up using the widest scope (UNIVERSE).
To achieve that we need to do two changes. Firstly, we need to create
another struct (FIB node) that will hold the list of FIB entries sharing
the same prefix and length. This struct will be hashed using these two
parameters.
Secondly, we need to change the route reflection to match the above
logic, so that the first FIB entry in the list will be programmed into
the device while the rest will remain in the driver's cache in case of
subsequent changes.
Signed-off-by: Ido Schimmel <idosch@mellanox.com>
Signed-off-by: Jiri Pirko <jiri@mellanox.com>
Signed-off-by: David S. Miller <davem@davemloft.net>
2017-02-09 17:28:42 +08:00
|
|
|
struct list_head node_list;
|
2017-03-10 15:53:41 +08:00
|
|
|
struct mlxsw_sp_vr *vr;
|
|
|
|
struct mlxsw_sp_lpm_tree *lpm_tree;
|
|
|
|
enum mlxsw_sp_l3proto proto;
|
2016-07-04 14:23:04 +08:00
|
|
|
};
|
|
|
|
|
2017-05-17 01:38:25 +08:00
|
|
|
struct mlxsw_sp_vr {
|
|
|
|
u16 id; /* virtual router ID */
|
|
|
|
u32 tb_id; /* kernel fib table id */
|
|
|
|
unsigned int rif_count;
|
|
|
|
struct mlxsw_sp_fib *fib4;
|
2017-07-18 16:10:22 +08:00
|
|
|
struct mlxsw_sp_fib *fib6;
|
2018-03-26 20:01:40 +08:00
|
|
|
struct mlxsw_sp_mr_table *mr_table[MLXSW_SP_L3_PROTO_MAX];
|
2019-01-20 14:50:51 +08:00
|
|
|
struct mlxsw_sp_rif *ul_rif;
|
|
|
|
refcount_t ul_rif_refcnt;
|
2017-05-17 01:38:25 +08:00
|
|
|
};
|
|
|
|
|
mlxsw: spectrum_router: Correctly handle identical routes
In the device, routes are indexed in a routing table based on the prefix
and its length. This is in contrast to the kernel's FIB where several
FIB aliases can exist with these parameters being identical. In such
cases, the routes will be sorted by table ID (LOCAL first, then MAIN),
TOS and finally priority (metric).
During lookup, these routes will be evaluated in order. In case the
packet's TOS field is non-zero and a FIB alias with a matching TOS is
found, then it's selected. Otherwise, the lookup defaults to the route
with TOS 0 (if it exists). However, if the requested scope is narrower
than the one found, then the lookup continues.
To best reflect the kernel's datapath we should take the above into
account. Given a prefix and its length, the reflected route will always
be the first one in the FIB alias list. However, if the route has a
non-zero TOS then its action will be converted to trap instead of
forward, since we currently don't support TOS-based routing. If this
turns out to be a real issue, we can add support for that using
policy-based switching.
The route's scope can be effectively ignored as any packet being routed
by the device would've been looked-up using the widest scope (UNIVERSE).
To achieve that we need to do two changes. Firstly, we need to create
another struct (FIB node) that will hold the list of FIB entries sharing
the same prefix and length. This struct will be hashed using these two
parameters.
Secondly, we need to change the route reflection to match the above
logic, so that the first FIB entry in the list will be programmed into
the device while the rest will remain in the driver's cache in case of
subsequent changes.
Signed-off-by: Ido Schimmel <idosch@mellanox.com>
Signed-off-by: Jiri Pirko <jiri@mellanox.com>
Signed-off-by: David S. Miller <davem@davemloft.net>
2017-02-09 17:28:42 +08:00
|
|
|
static const struct rhashtable_params mlxsw_sp_fib_ht_params;
|
2016-07-04 14:23:04 +08:00
|
|
|
|
2018-01-22 16:17:42 +08:00
|
|
|
static struct mlxsw_sp_fib *mlxsw_sp_fib_create(struct mlxsw_sp *mlxsw_sp,
|
|
|
|
struct mlxsw_sp_vr *vr,
|
2017-03-10 15:53:41 +08:00
|
|
|
enum mlxsw_sp_l3proto proto)
|
2016-07-04 14:23:04 +08:00
|
|
|
{
|
2018-01-22 16:17:42 +08:00
|
|
|
struct mlxsw_sp_lpm_tree *lpm_tree;
|
2016-07-04 14:23:04 +08:00
|
|
|
struct mlxsw_sp_fib *fib;
|
|
|
|
int err;
|
|
|
|
|
2018-01-22 16:17:42 +08:00
|
|
|
lpm_tree = mlxsw_sp->router->lpm.proto_trees[proto];
|
2016-07-04 14:23:04 +08:00
|
|
|
fib = kzalloc(sizeof(*fib), GFP_KERNEL);
|
|
|
|
if (!fib)
|
|
|
|
return ERR_PTR(-ENOMEM);
|
|
|
|
err = rhashtable_init(&fib->ht, &mlxsw_sp_fib_ht_params);
|
|
|
|
if (err)
|
|
|
|
goto err_rhashtable_init;
|
mlxsw: spectrum_router: Correctly handle identical routes
In the device, routes are indexed in a routing table based on the prefix
and its length. This is in contrast to the kernel's FIB where several
FIB aliases can exist with these parameters being identical. In such
cases, the routes will be sorted by table ID (LOCAL first, then MAIN),
TOS and finally priority (metric).
During lookup, these routes will be evaluated in order. In case the
packet's TOS field is non-zero and a FIB alias with a matching TOS is
found, then it's selected. Otherwise, the lookup defaults to the route
with TOS 0 (if it exists). However, if the requested scope is narrower
than the one found, then the lookup continues.
To best reflect the kernel's datapath we should take the above into
account. Given a prefix and its length, the reflected route will always
be the first one in the FIB alias list. However, if the route has a
non-zero TOS then its action will be converted to trap instead of
forward, since we currently don't support TOS-based routing. If this
turns out to be a real issue, we can add support for that using
policy-based switching.
The route's scope can be effectively ignored as any packet being routed
by the device would've been looked-up using the widest scope (UNIVERSE).
To achieve that we need to do two changes. Firstly, we need to create
another struct (FIB node) that will hold the list of FIB entries sharing
the same prefix and length. This struct will be hashed using these two
parameters.
Secondly, we need to change the route reflection to match the above
logic, so that the first FIB entry in the list will be programmed into
the device while the rest will remain in the driver's cache in case of
subsequent changes.
Signed-off-by: Ido Schimmel <idosch@mellanox.com>
Signed-off-by: Jiri Pirko <jiri@mellanox.com>
Signed-off-by: David S. Miller <davem@davemloft.net>
2017-02-09 17:28:42 +08:00
|
|
|
INIT_LIST_HEAD(&fib->node_list);
|
2017-03-10 15:53:41 +08:00
|
|
|
fib->proto = proto;
|
|
|
|
fib->vr = vr;
|
2018-01-22 16:17:42 +08:00
|
|
|
fib->lpm_tree = lpm_tree;
|
|
|
|
mlxsw_sp_lpm_tree_hold(lpm_tree);
|
|
|
|
err = mlxsw_sp_vr_lpm_tree_bind(mlxsw_sp, fib, lpm_tree->id);
|
|
|
|
if (err)
|
|
|
|
goto err_lpm_tree_bind;
|
2016-07-04 14:23:04 +08:00
|
|
|
return fib;
|
|
|
|
|
2018-01-22 16:17:42 +08:00
|
|
|
err_lpm_tree_bind:
|
|
|
|
mlxsw_sp_lpm_tree_put(mlxsw_sp, lpm_tree);
|
2016-07-04 14:23:04 +08:00
|
|
|
err_rhashtable_init:
|
|
|
|
kfree(fib);
|
|
|
|
return ERR_PTR(err);
|
|
|
|
}
|
|
|
|
|
2018-01-22 16:17:42 +08:00
|
|
|
static void mlxsw_sp_fib_destroy(struct mlxsw_sp *mlxsw_sp,
|
|
|
|
struct mlxsw_sp_fib *fib)
|
2016-07-04 14:23:04 +08:00
|
|
|
{
|
2018-01-22 16:17:42 +08:00
|
|
|
mlxsw_sp_vr_lpm_tree_unbind(mlxsw_sp, fib);
|
|
|
|
mlxsw_sp_lpm_tree_put(mlxsw_sp, fib->lpm_tree);
|
mlxsw: spectrum_router: Correctly handle identical routes
In the device, routes are indexed in a routing table based on the prefix
and its length. This is in contrast to the kernel's FIB where several
FIB aliases can exist with these parameters being identical. In such
cases, the routes will be sorted by table ID (LOCAL first, then MAIN),
TOS and finally priority (metric).
During lookup, these routes will be evaluated in order. In case the
packet's TOS field is non-zero and a FIB alias with a matching TOS is
found, then it's selected. Otherwise, the lookup defaults to the route
with TOS 0 (if it exists). However, if the requested scope is narrower
than the one found, then the lookup continues.
To best reflect the kernel's datapath we should take the above into
account. Given a prefix and its length, the reflected route will always
be the first one in the FIB alias list. However, if the route has a
non-zero TOS then its action will be converted to trap instead of
forward, since we currently don't support TOS-based routing. If this
turns out to be a real issue, we can add support for that using
policy-based switching.
The route's scope can be effectively ignored as any packet being routed
by the device would've been looked-up using the widest scope (UNIVERSE).
To achieve that we need to do two changes. Firstly, we need to create
another struct (FIB node) that will hold the list of FIB entries sharing
the same prefix and length. This struct will be hashed using these two
parameters.
Secondly, we need to change the route reflection to match the above
logic, so that the first FIB entry in the list will be programmed into
the device while the rest will remain in the driver's cache in case of
subsequent changes.
Signed-off-by: Ido Schimmel <idosch@mellanox.com>
Signed-off-by: Jiri Pirko <jiri@mellanox.com>
Signed-off-by: David S. Miller <davem@davemloft.net>
2017-02-09 17:28:42 +08:00
|
|
|
WARN_ON(!list_empty(&fib->node_list));
|
2016-07-04 14:23:04 +08:00
|
|
|
rhashtable_destroy(&fib->ht);
|
|
|
|
kfree(fib);
|
|
|
|
}
|
|
|
|
|
2016-07-04 14:23:08 +08:00
|
|
|
static struct mlxsw_sp_lpm_tree *
|
2017-03-10 15:53:40 +08:00
|
|
|
mlxsw_sp_lpm_tree_find_unused(struct mlxsw_sp *mlxsw_sp)
|
2016-07-04 14:23:08 +08:00
|
|
|
{
|
|
|
|
static struct mlxsw_sp_lpm_tree *lpm_tree;
|
|
|
|
int i;
|
|
|
|
|
2017-05-17 01:38:25 +08:00
|
|
|
for (i = 0; i < mlxsw_sp->router->lpm.tree_count; i++) {
|
|
|
|
lpm_tree = &mlxsw_sp->router->lpm.trees[i];
|
2017-03-10 15:53:40 +08:00
|
|
|
if (lpm_tree->ref_count == 0)
|
|
|
|
return lpm_tree;
|
2016-07-04 14:23:08 +08:00
|
|
|
}
|
|
|
|
return NULL;
|
|
|
|
}
|
|
|
|
|
|
|
|
static int mlxsw_sp_lpm_tree_alloc(struct mlxsw_sp *mlxsw_sp,
|
|
|
|
struct mlxsw_sp_lpm_tree *lpm_tree)
|
|
|
|
{
|
|
|
|
char ralta_pl[MLXSW_REG_RALTA_LEN];
|
|
|
|
|
2016-09-19 14:29:26 +08:00
|
|
|
mlxsw_reg_ralta_pack(ralta_pl, true,
|
|
|
|
(enum mlxsw_reg_ralxx_protocol) lpm_tree->proto,
|
|
|
|
lpm_tree->id);
|
2016-07-04 14:23:08 +08:00
|
|
|
return mlxsw_reg_write(mlxsw_sp->core, MLXSW_REG(ralta), ralta_pl);
|
|
|
|
}
|
|
|
|
|
2017-08-14 16:54:03 +08:00
|
|
|
static void mlxsw_sp_lpm_tree_free(struct mlxsw_sp *mlxsw_sp,
|
|
|
|
struct mlxsw_sp_lpm_tree *lpm_tree)
|
2016-07-04 14:23:08 +08:00
|
|
|
{
|
|
|
|
char ralta_pl[MLXSW_REG_RALTA_LEN];
|
|
|
|
|
2016-09-19 14:29:26 +08:00
|
|
|
mlxsw_reg_ralta_pack(ralta_pl, false,
|
|
|
|
(enum mlxsw_reg_ralxx_protocol) lpm_tree->proto,
|
|
|
|
lpm_tree->id);
|
2017-08-14 16:54:03 +08:00
|
|
|
mlxsw_reg_write(mlxsw_sp->core, MLXSW_REG(ralta), ralta_pl);
|
2016-07-04 14:23:08 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
static int
|
|
|
|
mlxsw_sp_lpm_tree_left_struct_set(struct mlxsw_sp *mlxsw_sp,
|
|
|
|
struct mlxsw_sp_prefix_usage *prefix_usage,
|
|
|
|
struct mlxsw_sp_lpm_tree *lpm_tree)
|
|
|
|
{
|
|
|
|
char ralst_pl[MLXSW_REG_RALST_LEN];
|
|
|
|
u8 root_bin = 0;
|
|
|
|
u8 prefix;
|
|
|
|
u8 last_prefix = MLXSW_REG_RALST_BIN_NO_CHILD;
|
|
|
|
|
|
|
|
mlxsw_sp_prefix_usage_for_each(prefix, prefix_usage)
|
|
|
|
root_bin = prefix;
|
|
|
|
|
|
|
|
mlxsw_reg_ralst_pack(ralst_pl, root_bin, lpm_tree->id);
|
|
|
|
mlxsw_sp_prefix_usage_for_each(prefix, prefix_usage) {
|
|
|
|
if (prefix == 0)
|
|
|
|
continue;
|
|
|
|
mlxsw_reg_ralst_bin_pack(ralst_pl, prefix, last_prefix,
|
|
|
|
MLXSW_REG_RALST_BIN_NO_CHILD);
|
|
|
|
last_prefix = prefix;
|
|
|
|
}
|
|
|
|
return mlxsw_reg_write(mlxsw_sp->core, MLXSW_REG(ralst), ralst_pl);
|
|
|
|
}
|
|
|
|
|
|
|
|
static struct mlxsw_sp_lpm_tree *
|
|
|
|
mlxsw_sp_lpm_tree_create(struct mlxsw_sp *mlxsw_sp,
|
|
|
|
struct mlxsw_sp_prefix_usage *prefix_usage,
|
2017-03-10 15:53:40 +08:00
|
|
|
enum mlxsw_sp_l3proto proto)
|
2016-07-04 14:23:08 +08:00
|
|
|
{
|
|
|
|
struct mlxsw_sp_lpm_tree *lpm_tree;
|
|
|
|
int err;
|
|
|
|
|
2017-03-10 15:53:40 +08:00
|
|
|
lpm_tree = mlxsw_sp_lpm_tree_find_unused(mlxsw_sp);
|
2016-07-04 14:23:08 +08:00
|
|
|
if (!lpm_tree)
|
|
|
|
return ERR_PTR(-EBUSY);
|
|
|
|
lpm_tree->proto = proto;
|
|
|
|
err = mlxsw_sp_lpm_tree_alloc(mlxsw_sp, lpm_tree);
|
|
|
|
if (err)
|
|
|
|
return ERR_PTR(err);
|
|
|
|
|
|
|
|
err = mlxsw_sp_lpm_tree_left_struct_set(mlxsw_sp, prefix_usage,
|
|
|
|
lpm_tree);
|
|
|
|
if (err)
|
|
|
|
goto err_left_struct_set;
|
2016-10-25 17:25:56 +08:00
|
|
|
memcpy(&lpm_tree->prefix_usage, prefix_usage,
|
|
|
|
sizeof(lpm_tree->prefix_usage));
|
2018-01-22 16:17:42 +08:00
|
|
|
memset(&lpm_tree->prefix_ref_count, 0,
|
|
|
|
sizeof(lpm_tree->prefix_ref_count));
|
|
|
|
lpm_tree->ref_count = 1;
|
2016-07-04 14:23:08 +08:00
|
|
|
return lpm_tree;
|
|
|
|
|
|
|
|
err_left_struct_set:
|
|
|
|
mlxsw_sp_lpm_tree_free(mlxsw_sp, lpm_tree);
|
|
|
|
return ERR_PTR(err);
|
|
|
|
}
|
|
|
|
|
2017-08-14 16:54:03 +08:00
|
|
|
/* Destroy @lpm_tree. This only frees the tree via
 * mlxsw_sp_lpm_tree_free(); no other state is touched here.
 */
static void mlxsw_sp_lpm_tree_destroy(struct mlxsw_sp *mlxsw_sp,
				      struct mlxsw_sp_lpm_tree *lpm_tree)
{
	mlxsw_sp_lpm_tree_free(mlxsw_sp, lpm_tree);
}
|
|
|
|
|
|
|
|
static struct mlxsw_sp_lpm_tree *
|
|
|
|
mlxsw_sp_lpm_tree_get(struct mlxsw_sp *mlxsw_sp,
|
|
|
|
struct mlxsw_sp_prefix_usage *prefix_usage,
|
2017-03-10 15:53:40 +08:00
|
|
|
enum mlxsw_sp_l3proto proto)
|
2016-07-04 14:23:08 +08:00
|
|
|
{
|
|
|
|
struct mlxsw_sp_lpm_tree *lpm_tree;
|
|
|
|
int i;
|
|
|
|
|
2017-05-17 01:38:25 +08:00
|
|
|
for (i = 0; i < mlxsw_sp->router->lpm.tree_count; i++) {
|
|
|
|
lpm_tree = &mlxsw_sp->router->lpm.trees[i];
|
2016-10-25 17:25:57 +08:00
|
|
|
if (lpm_tree->ref_count != 0 &&
|
|
|
|
lpm_tree->proto == proto &&
|
2016-07-04 14:23:08 +08:00
|
|
|
mlxsw_sp_prefix_usage_eq(&lpm_tree->prefix_usage,
|
2018-01-22 16:17:42 +08:00
|
|
|
prefix_usage)) {
|
|
|
|
mlxsw_sp_lpm_tree_hold(lpm_tree);
|
2017-08-14 16:54:05 +08:00
|
|
|
return lpm_tree;
|
2018-01-22 16:17:42 +08:00
|
|
|
}
|
2016-07-04 14:23:08 +08:00
|
|
|
}
|
2017-08-14 16:54:05 +08:00
|
|
|
return mlxsw_sp_lpm_tree_create(mlxsw_sp, prefix_usage, proto);
|
|
|
|
}
|
2016-07-04 14:23:08 +08:00
|
|
|
|
2017-08-14 16:54:05 +08:00
|
|
|
static void mlxsw_sp_lpm_tree_hold(struct mlxsw_sp_lpm_tree *lpm_tree)
|
|
|
|
{
|
2016-07-04 14:23:08 +08:00
|
|
|
lpm_tree->ref_count++;
|
|
|
|
}
|
|
|
|
|
2017-08-14 16:54:03 +08:00
|
|
|
static void mlxsw_sp_lpm_tree_put(struct mlxsw_sp *mlxsw_sp,
|
|
|
|
struct mlxsw_sp_lpm_tree *lpm_tree)
|
2016-07-04 14:23:08 +08:00
|
|
|
{
|
|
|
|
if (--lpm_tree->ref_count == 0)
|
2017-08-14 16:54:03 +08:00
|
|
|
mlxsw_sp_lpm_tree_destroy(mlxsw_sp, lpm_tree);
|
2016-07-04 14:23:08 +08:00
|
|
|
}
|
|
|
|
|
2017-06-08 14:47:43 +08:00
|
|
|
#define MLXSW_SP_LPM_TREE_MIN 1 /* tree 0 is reserved */
|
2017-03-24 15:02:47 +08:00
|
|
|
|
|
|
|
static int mlxsw_sp_lpm_init(struct mlxsw_sp *mlxsw_sp)
|
2016-07-04 14:23:08 +08:00
|
|
|
{
|
2018-01-22 16:17:42 +08:00
|
|
|
struct mlxsw_sp_prefix_usage req_prefix_usage = {{ 0 } };
|
2016-07-04 14:23:08 +08:00
|
|
|
struct mlxsw_sp_lpm_tree *lpm_tree;
|
2017-03-24 15:02:47 +08:00
|
|
|
u64 max_trees;
|
2018-01-22 16:17:42 +08:00
|
|
|
int err, i;
|
2016-07-04 14:23:08 +08:00
|
|
|
|
2017-03-24 15:02:47 +08:00
|
|
|
if (!MLXSW_CORE_RES_VALID(mlxsw_sp->core, MAX_LPM_TREES))
|
|
|
|
return -EIO;
|
|
|
|
|
|
|
|
max_trees = MLXSW_CORE_RES_GET(mlxsw_sp->core, MAX_LPM_TREES);
|
2017-05-17 01:38:25 +08:00
|
|
|
mlxsw_sp->router->lpm.tree_count = max_trees - MLXSW_SP_LPM_TREE_MIN;
|
|
|
|
mlxsw_sp->router->lpm.trees = kcalloc(mlxsw_sp->router->lpm.tree_count,
|
2017-03-24 15:02:47 +08:00
|
|
|
sizeof(struct mlxsw_sp_lpm_tree),
|
|
|
|
GFP_KERNEL);
|
2017-05-17 01:38:25 +08:00
|
|
|
if (!mlxsw_sp->router->lpm.trees)
|
2017-03-24 15:02:47 +08:00
|
|
|
return -ENOMEM;
|
|
|
|
|
2017-05-17 01:38:25 +08:00
|
|
|
for (i = 0; i < mlxsw_sp->router->lpm.tree_count; i++) {
|
|
|
|
lpm_tree = &mlxsw_sp->router->lpm.trees[i];
|
2016-07-04 14:23:08 +08:00
|
|
|
lpm_tree->id = i + MLXSW_SP_LPM_TREE_MIN;
|
|
|
|
}
|
2017-03-24 15:02:47 +08:00
|
|
|
|
2018-01-22 16:17:42 +08:00
|
|
|
lpm_tree = mlxsw_sp_lpm_tree_get(mlxsw_sp, &req_prefix_usage,
|
|
|
|
MLXSW_SP_L3_PROTO_IPV4);
|
|
|
|
if (IS_ERR(lpm_tree)) {
|
|
|
|
err = PTR_ERR(lpm_tree);
|
|
|
|
goto err_ipv4_tree_get;
|
|
|
|
}
|
|
|
|
mlxsw_sp->router->lpm.proto_trees[MLXSW_SP_L3_PROTO_IPV4] = lpm_tree;
|
|
|
|
|
|
|
|
lpm_tree = mlxsw_sp_lpm_tree_get(mlxsw_sp, &req_prefix_usage,
|
|
|
|
MLXSW_SP_L3_PROTO_IPV6);
|
|
|
|
if (IS_ERR(lpm_tree)) {
|
|
|
|
err = PTR_ERR(lpm_tree);
|
|
|
|
goto err_ipv6_tree_get;
|
|
|
|
}
|
|
|
|
mlxsw_sp->router->lpm.proto_trees[MLXSW_SP_L3_PROTO_IPV6] = lpm_tree;
|
|
|
|
|
2017-03-24 15:02:47 +08:00
|
|
|
return 0;
|
2018-01-22 16:17:42 +08:00
|
|
|
|
|
|
|
err_ipv6_tree_get:
|
|
|
|
lpm_tree = mlxsw_sp->router->lpm.proto_trees[MLXSW_SP_L3_PROTO_IPV4];
|
|
|
|
mlxsw_sp_lpm_tree_put(mlxsw_sp, lpm_tree);
|
|
|
|
err_ipv4_tree_get:
|
|
|
|
kfree(mlxsw_sp->router->lpm.trees);
|
|
|
|
return err;
|
2017-03-24 15:02:47 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
static void mlxsw_sp_lpm_fini(struct mlxsw_sp *mlxsw_sp)
|
|
|
|
{
|
2018-01-22 16:17:42 +08:00
|
|
|
struct mlxsw_sp_lpm_tree *lpm_tree;
|
|
|
|
|
|
|
|
lpm_tree = mlxsw_sp->router->lpm.proto_trees[MLXSW_SP_L3_PROTO_IPV6];
|
|
|
|
mlxsw_sp_lpm_tree_put(mlxsw_sp, lpm_tree);
|
|
|
|
|
|
|
|
lpm_tree = mlxsw_sp->router->lpm.proto_trees[MLXSW_SP_L3_PROTO_IPV4];
|
|
|
|
mlxsw_sp_lpm_tree_put(mlxsw_sp, lpm_tree);
|
|
|
|
|
2017-05-17 01:38:25 +08:00
|
|
|
kfree(mlxsw_sp->router->lpm.trees);
|
2016-07-04 14:23:08 +08:00
|
|
|
}
|
|
|
|
|
2017-03-10 15:53:41 +08:00
|
|
|
static bool mlxsw_sp_vr_is_used(const struct mlxsw_sp_vr *vr)
|
|
|
|
{
|
2018-03-26 20:01:40 +08:00
|
|
|
return !!vr->fib4 || !!vr->fib6 ||
|
|
|
|
!!vr->mr_table[MLXSW_SP_L3_PROTO_IPV4] ||
|
|
|
|
!!vr->mr_table[MLXSW_SP_L3_PROTO_IPV6];
|
2017-03-10 15:53:41 +08:00
|
|
|
}
|
|
|
|
|
2016-07-04 14:23:09 +08:00
|
|
|
static struct mlxsw_sp_vr *mlxsw_sp_vr_find_unused(struct mlxsw_sp *mlxsw_sp)
|
|
|
|
{
|
|
|
|
struct mlxsw_sp_vr *vr;
|
|
|
|
int i;
|
|
|
|
|
2016-10-21 22:07:23 +08:00
|
|
|
for (i = 0; i < MLXSW_CORE_RES_GET(mlxsw_sp->core, MAX_VRS); i++) {
|
2017-05-17 01:38:25 +08:00
|
|
|
vr = &mlxsw_sp->router->vrs[i];
|
2017-03-10 15:53:41 +08:00
|
|
|
if (!mlxsw_sp_vr_is_used(vr))
|
2016-07-04 14:23:09 +08:00
|
|
|
return vr;
|
|
|
|
}
|
|
|
|
return NULL;
|
|
|
|
}
|
|
|
|
|
|
|
|
/* Write a RALTB register binding the virtual router and protocol of @fib
 * to the LPM tree identified by @tree_id. Returns the result of the
 * register write.
 */
static int mlxsw_sp_vr_lpm_tree_bind(struct mlxsw_sp *mlxsw_sp,
				     const struct mlxsw_sp_fib *fib, u8 tree_id)
{
	enum mlxsw_reg_ralxx_protocol ralxx_proto;
	char raltb_pl[MLXSW_REG_RALTB_LEN];

	ralxx_proto = (enum mlxsw_reg_ralxx_protocol) fib->proto;
	mlxsw_reg_raltb_pack(raltb_pl, fib->vr->id, ralxx_proto, tree_id);

	return mlxsw_reg_write(mlxsw_sp->core, MLXSW_REG(raltb), raltb_pl);
}
|
|
|
|
|
|
|
|
static int mlxsw_sp_vr_lpm_tree_unbind(struct mlxsw_sp *mlxsw_sp,
|
2017-03-10 15:53:41 +08:00
|
|
|
const struct mlxsw_sp_fib *fib)
|
2016-07-04 14:23:09 +08:00
|
|
|
{
|
|
|
|
char raltb_pl[MLXSW_REG_RALTB_LEN];
|
|
|
|
|
|
|
|
/* Bind to tree 0 which is default */
|
2017-03-10 15:53:41 +08:00
|
|
|
mlxsw_reg_raltb_pack(raltb_pl, fib->vr->id,
|
|
|
|
(enum mlxsw_reg_ralxx_protocol) fib->proto, 0);
|
2016-07-04 14:23:09 +08:00
|
|
|
return mlxsw_reg_write(mlxsw_sp->core, MLXSW_REG(raltb), raltb_pl);
|
|
|
|
}
|
|
|
|
|
|
|
|
/* Normalize a kernel table ID: the local and default tables are treated
 * as the main table, every other ID is returned unchanged.
 */
static u32 mlxsw_sp_fix_tb_id(u32 tb_id)
{
	switch (tb_id) {
	case RT_TABLE_LOCAL:
	case RT_TABLE_DEFAULT:
		/* Squashed into the main table for our purpose */
		return RT_TABLE_MAIN;
	default:
		return tb_id;
	}
}
|
|
|
|
|
|
|
|
static struct mlxsw_sp_vr *mlxsw_sp_vr_find(struct mlxsw_sp *mlxsw_sp,
|
2017-03-10 15:53:41 +08:00
|
|
|
u32 tb_id)
|
2016-07-04 14:23:09 +08:00
|
|
|
{
|
|
|
|
struct mlxsw_sp_vr *vr;
|
|
|
|
int i;
|
|
|
|
|
|
|
|
tb_id = mlxsw_sp_fix_tb_id(tb_id);
|
2016-09-20 17:16:54 +08:00
|
|
|
|
2016-10-21 22:07:23 +08:00
|
|
|
for (i = 0; i < MLXSW_CORE_RES_GET(mlxsw_sp->core, MAX_VRS); i++) {
|
2017-05-17 01:38:25 +08:00
|
|
|
vr = &mlxsw_sp->router->vrs[i];
|
2017-03-10 15:53:41 +08:00
|
|
|
if (mlxsw_sp_vr_is_used(vr) && vr->tb_id == tb_id)
|
2016-07-04 14:23:09 +08:00
|
|
|
return vr;
|
|
|
|
}
|
|
|
|
return NULL;
|
|
|
|
}
|
|
|
|
|
2018-10-17 16:53:08 +08:00
|
|
|
int mlxsw_sp_router_tb_id_vr_id(struct mlxsw_sp *mlxsw_sp, u32 tb_id,
|
|
|
|
u16 *vr_id)
|
|
|
|
{
|
|
|
|
struct mlxsw_sp_vr *vr;
|
|
|
|
|
|
|
|
vr = mlxsw_sp_vr_find(mlxsw_sp, tb_id);
|
|
|
|
if (!vr)
|
|
|
|
return -ESRCH;
|
|
|
|
*vr_id = vr->id;
|
|
|
|
|
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
2017-03-10 15:53:41 +08:00
|
|
|
static struct mlxsw_sp_fib *mlxsw_sp_vr_fib(const struct mlxsw_sp_vr *vr,
|
|
|
|
enum mlxsw_sp_l3proto proto)
|
|
|
|
{
|
|
|
|
switch (proto) {
|
|
|
|
case MLXSW_SP_L3_PROTO_IPV4:
|
|
|
|
return vr->fib4;
|
|
|
|
case MLXSW_SP_L3_PROTO_IPV6:
|
2017-07-18 16:10:22 +08:00
|
|
|
return vr->fib6;
|
2017-03-10 15:53:41 +08:00
|
|
|
}
|
|
|
|
return NULL;
|
|
|
|
}
|
|
|
|
|
2016-07-04 14:23:09 +08:00
|
|
|
static struct mlxsw_sp_vr *mlxsw_sp_vr_create(struct mlxsw_sp *mlxsw_sp,
|
2017-10-19 00:56:56 +08:00
|
|
|
u32 tb_id,
|
|
|
|
struct netlink_ext_ack *extack)
|
2016-07-04 14:23:09 +08:00
|
|
|
{
|
2018-03-26 20:01:40 +08:00
|
|
|
struct mlxsw_sp_mr_table *mr4_table, *mr6_table;
|
2018-02-13 18:22:42 +08:00
|
|
|
struct mlxsw_sp_fib *fib4;
|
|
|
|
struct mlxsw_sp_fib *fib6;
|
2016-07-04 14:23:09 +08:00
|
|
|
struct mlxsw_sp_vr *vr;
|
2017-07-18 16:10:22 +08:00
|
|
|
int err;
|
2016-07-04 14:23:09 +08:00
|
|
|
|
|
|
|
vr = mlxsw_sp_vr_find_unused(mlxsw_sp);
|
2017-10-19 00:56:56 +08:00
|
|
|
if (!vr) {
|
2018-02-13 18:29:05 +08:00
|
|
|
NL_SET_ERR_MSG_MOD(extack, "Exceeded number of supported virtual routers");
|
2016-07-04 14:23:09 +08:00
|
|
|
return ERR_PTR(-EBUSY);
|
2017-10-19 00:56:56 +08:00
|
|
|
}
|
2018-02-13 18:22:42 +08:00
|
|
|
fib4 = mlxsw_sp_fib_create(mlxsw_sp, vr, MLXSW_SP_L3_PROTO_IPV4);
|
|
|
|
if (IS_ERR(fib4))
|
|
|
|
return ERR_CAST(fib4);
|
|
|
|
fib6 = mlxsw_sp_fib_create(mlxsw_sp, vr, MLXSW_SP_L3_PROTO_IPV6);
|
|
|
|
if (IS_ERR(fib6)) {
|
|
|
|
err = PTR_ERR(fib6);
|
2017-07-18 16:10:22 +08:00
|
|
|
goto err_fib6_create;
|
|
|
|
}
|
2018-02-13 18:22:42 +08:00
|
|
|
mr4_table = mlxsw_sp_mr_table_create(mlxsw_sp, vr->id,
|
|
|
|
MLXSW_SP_L3_PROTO_IPV4);
|
|
|
|
if (IS_ERR(mr4_table)) {
|
|
|
|
err = PTR_ERR(mr4_table);
|
2018-03-26 20:01:40 +08:00
|
|
|
goto err_mr4_table_create;
|
2017-09-27 14:23:20 +08:00
|
|
|
}
|
2018-03-26 20:01:40 +08:00
|
|
|
mr6_table = mlxsw_sp_mr_table_create(mlxsw_sp, vr->id,
|
|
|
|
MLXSW_SP_L3_PROTO_IPV6);
|
|
|
|
if (IS_ERR(mr6_table)) {
|
|
|
|
err = PTR_ERR(mr6_table);
|
|
|
|
goto err_mr6_table_create;
|
|
|
|
}
|
|
|
|
|
2018-02-13 18:22:42 +08:00
|
|
|
vr->fib4 = fib4;
|
|
|
|
vr->fib6 = fib6;
|
2018-03-26 20:01:40 +08:00
|
|
|
vr->mr_table[MLXSW_SP_L3_PROTO_IPV4] = mr4_table;
|
|
|
|
vr->mr_table[MLXSW_SP_L3_PROTO_IPV6] = mr6_table;
|
2016-07-04 14:23:09 +08:00
|
|
|
vr->tb_id = tb_id;
|
|
|
|
return vr;
|
2017-07-18 16:10:22 +08:00
|
|
|
|
2018-03-26 20:01:40 +08:00
|
|
|
err_mr6_table_create:
|
|
|
|
mlxsw_sp_mr_table_destroy(mr4_table);
|
|
|
|
err_mr4_table_create:
|
2018-02-13 18:22:42 +08:00
|
|
|
mlxsw_sp_fib_destroy(mlxsw_sp, fib6);
|
2017-07-18 16:10:22 +08:00
|
|
|
err_fib6_create:
|
2018-02-13 18:22:42 +08:00
|
|
|
mlxsw_sp_fib_destroy(mlxsw_sp, fib4);
|
2017-07-18 16:10:22 +08:00
|
|
|
return ERR_PTR(err);
|
2016-07-04 14:23:09 +08:00
|
|
|
}
|
|
|
|
|
2018-01-22 16:17:42 +08:00
|
|
|
static void mlxsw_sp_vr_destroy(struct mlxsw_sp *mlxsw_sp,
|
|
|
|
struct mlxsw_sp_vr *vr)
|
2016-07-04 14:23:09 +08:00
|
|
|
{
|
2018-03-26 20:01:40 +08:00
|
|
|
mlxsw_sp_mr_table_destroy(vr->mr_table[MLXSW_SP_L3_PROTO_IPV6]);
|
|
|
|
vr->mr_table[MLXSW_SP_L3_PROTO_IPV6] = NULL;
|
|
|
|
mlxsw_sp_mr_table_destroy(vr->mr_table[MLXSW_SP_L3_PROTO_IPV4]);
|
|
|
|
vr->mr_table[MLXSW_SP_L3_PROTO_IPV4] = NULL;
|
2018-01-22 16:17:42 +08:00
|
|
|
mlxsw_sp_fib_destroy(mlxsw_sp, vr->fib6);
|
2017-07-18 16:10:22 +08:00
|
|
|
vr->fib6 = NULL;
|
2018-01-22 16:17:42 +08:00
|
|
|
mlxsw_sp_fib_destroy(mlxsw_sp, vr->fib4);
|
2017-03-10 15:53:41 +08:00
|
|
|
vr->fib4 = NULL;
|
2016-07-04 14:23:09 +08:00
|
|
|
}
|
|
|
|
|
2017-10-19 00:56:56 +08:00
|
|
|
/* Return the virtual router for the normalized @tb_id, creating it when
 * no in-use virtual router matches. May return an ERR_PTR() from the
 * create path.
 */
static struct mlxsw_sp_vr *mlxsw_sp_vr_get(struct mlxsw_sp *mlxsw_sp, u32 tb_id,
					   struct netlink_ext_ack *extack)
{
	struct mlxsw_sp_vr *existing;

	tb_id = mlxsw_sp_fix_tb_id(tb_id);

	existing = mlxsw_sp_vr_find(mlxsw_sp, tb_id);
	if (existing)
		return existing;

	return mlxsw_sp_vr_create(mlxsw_sp, tb_id, extack);
}
|
|
|
|
|
2018-01-22 16:17:42 +08:00
|
|
|
static void mlxsw_sp_vr_put(struct mlxsw_sp *mlxsw_sp, struct mlxsw_sp_vr *vr)
|
2016-07-04 14:23:09 +08:00
|
|
|
{
|
2017-07-18 16:10:22 +08:00
|
|
|
if (!vr->rif_count && list_empty(&vr->fib4->node_list) &&
|
2017-09-27 14:23:20 +08:00
|
|
|
list_empty(&vr->fib6->node_list) &&
|
2018-03-26 20:01:40 +08:00
|
|
|
mlxsw_sp_mr_table_empty(vr->mr_table[MLXSW_SP_L3_PROTO_IPV4]) &&
|
|
|
|
mlxsw_sp_mr_table_empty(vr->mr_table[MLXSW_SP_L3_PROTO_IPV6]))
|
2018-01-22 16:17:42 +08:00
|
|
|
mlxsw_sp_vr_destroy(mlxsw_sp, vr);
|
2016-07-04 14:23:09 +08:00
|
|
|
}
|
|
|
|
|
2017-08-14 16:54:05 +08:00
|
|
|
static bool
|
|
|
|
mlxsw_sp_vr_lpm_tree_should_replace(struct mlxsw_sp_vr *vr,
|
|
|
|
enum mlxsw_sp_l3proto proto, u8 tree_id)
|
|
|
|
{
|
|
|
|
struct mlxsw_sp_fib *fib = mlxsw_sp_vr_fib(vr, proto);
|
|
|
|
|
|
|
|
if (!mlxsw_sp_vr_is_used(vr))
|
|
|
|
return false;
|
2018-01-22 16:17:42 +08:00
|
|
|
if (fib->lpm_tree->id == tree_id)
|
2017-08-14 16:54:05 +08:00
|
|
|
return true;
|
|
|
|
return false;
|
|
|
|
}
|
|
|
|
|
|
|
|
static int mlxsw_sp_vr_lpm_tree_replace(struct mlxsw_sp *mlxsw_sp,
|
|
|
|
struct mlxsw_sp_fib *fib,
|
|
|
|
struct mlxsw_sp_lpm_tree *new_tree)
|
|
|
|
{
|
|
|
|
struct mlxsw_sp_lpm_tree *old_tree = fib->lpm_tree;
|
|
|
|
int err;
|
|
|
|
|
|
|
|
fib->lpm_tree = new_tree;
|
|
|
|
mlxsw_sp_lpm_tree_hold(new_tree);
|
2018-01-18 22:42:10 +08:00
|
|
|
err = mlxsw_sp_vr_lpm_tree_bind(mlxsw_sp, fib, new_tree->id);
|
|
|
|
if (err)
|
|
|
|
goto err_tree_bind;
|
2017-08-14 16:54:05 +08:00
|
|
|
mlxsw_sp_lpm_tree_put(mlxsw_sp, old_tree);
|
|
|
|
return 0;
|
2018-01-18 22:42:10 +08:00
|
|
|
|
|
|
|
err_tree_bind:
|
|
|
|
mlxsw_sp_lpm_tree_put(mlxsw_sp, new_tree);
|
|
|
|
fib->lpm_tree = old_tree;
|
|
|
|
return err;
|
2017-08-14 16:54:05 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
static int mlxsw_sp_vrs_lpm_tree_replace(struct mlxsw_sp *mlxsw_sp,
|
|
|
|
struct mlxsw_sp_fib *fib,
|
|
|
|
struct mlxsw_sp_lpm_tree *new_tree)
|
|
|
|
{
|
|
|
|
enum mlxsw_sp_l3proto proto = fib->proto;
|
2018-01-22 16:17:42 +08:00
|
|
|
struct mlxsw_sp_lpm_tree *old_tree;
|
2017-08-14 16:54:05 +08:00
|
|
|
u8 old_id, new_id = new_tree->id;
|
|
|
|
struct mlxsw_sp_vr *vr;
|
|
|
|
int i, err;
|
|
|
|
|
2018-01-22 16:17:42 +08:00
|
|
|
old_tree = mlxsw_sp->router->lpm.proto_trees[proto];
|
2017-08-14 16:54:05 +08:00
|
|
|
old_id = old_tree->id;
|
|
|
|
|
|
|
|
for (i = 0; i < MLXSW_CORE_RES_GET(mlxsw_sp->core, MAX_VRS); i++) {
|
|
|
|
vr = &mlxsw_sp->router->vrs[i];
|
|
|
|
if (!mlxsw_sp_vr_lpm_tree_should_replace(vr, proto, old_id))
|
|
|
|
continue;
|
|
|
|
err = mlxsw_sp_vr_lpm_tree_replace(mlxsw_sp,
|
|
|
|
mlxsw_sp_vr_fib(vr, proto),
|
|
|
|
new_tree);
|
|
|
|
if (err)
|
|
|
|
goto err_tree_replace;
|
|
|
|
}
|
|
|
|
|
2018-01-22 16:17:42 +08:00
|
|
|
memcpy(new_tree->prefix_ref_count, old_tree->prefix_ref_count,
|
|
|
|
sizeof(new_tree->prefix_ref_count));
|
|
|
|
mlxsw_sp->router->lpm.proto_trees[proto] = new_tree;
|
|
|
|
mlxsw_sp_lpm_tree_put(mlxsw_sp, old_tree);
|
|
|
|
|
2017-08-14 16:54:05 +08:00
|
|
|
return 0;
|
|
|
|
|
|
|
|
err_tree_replace:
|
|
|
|
for (i--; i >= 0; i--) {
|
|
|
|
if (!mlxsw_sp_vr_lpm_tree_should_replace(vr, proto, new_id))
|
|
|
|
continue;
|
|
|
|
mlxsw_sp_vr_lpm_tree_replace(mlxsw_sp,
|
|
|
|
mlxsw_sp_vr_fib(vr, proto),
|
|
|
|
old_tree);
|
|
|
|
}
|
|
|
|
return err;
|
|
|
|
}
|
|
|
|
|
2016-09-20 17:16:54 +08:00
|
|
|
static int mlxsw_sp_vrs_init(struct mlxsw_sp *mlxsw_sp)
|
2016-07-04 14:23:09 +08:00
|
|
|
{
|
|
|
|
struct mlxsw_sp_vr *vr;
|
2016-10-21 22:07:23 +08:00
|
|
|
u64 max_vrs;
|
2016-07-04 14:23:09 +08:00
|
|
|
int i;
|
|
|
|
|
2016-10-21 22:07:23 +08:00
|
|
|
if (!MLXSW_CORE_RES_VALID(mlxsw_sp->core, MAX_VRS))
|
2016-09-20 17:16:54 +08:00
|
|
|
return -EIO;
|
|
|
|
|
2016-10-21 22:07:23 +08:00
|
|
|
max_vrs = MLXSW_CORE_RES_GET(mlxsw_sp->core, MAX_VRS);
|
2017-05-17 01:38:25 +08:00
|
|
|
mlxsw_sp->router->vrs = kcalloc(max_vrs, sizeof(struct mlxsw_sp_vr),
|
|
|
|
GFP_KERNEL);
|
|
|
|
if (!mlxsw_sp->router->vrs)
|
2016-09-20 17:16:54 +08:00
|
|
|
return -ENOMEM;
|
|
|
|
|
2016-10-21 22:07:23 +08:00
|
|
|
for (i = 0; i < max_vrs; i++) {
|
2017-05-17 01:38:25 +08:00
|
|
|
vr = &mlxsw_sp->router->vrs[i];
|
2016-07-04 14:23:09 +08:00
|
|
|
vr->id = i;
|
|
|
|
}
|
2016-09-20 17:16:54 +08:00
|
|
|
|
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
2016-11-14 18:26:32 +08:00
|
|
|
static void mlxsw_sp_router_fib_flush(struct mlxsw_sp *mlxsw_sp);
|
|
|
|
|
2016-09-20 17:16:54 +08:00
|
|
|
static void mlxsw_sp_vrs_fini(struct mlxsw_sp *mlxsw_sp)
|
|
|
|
{
|
2016-12-03 23:45:01 +08:00
|
|
|
/* At this stage we're guaranteed not to have new incoming
|
|
|
|
* FIB notifications and the work queue is free from FIBs
|
|
|
|
* sitting on top of mlxsw netdevs. However, we can still
|
|
|
|
* have other FIBs queued. Flush the queue before flushing
|
|
|
|
* the device's tables. No need for locks, as we're the only
|
|
|
|
* writer.
|
|
|
|
*/
|
|
|
|
mlxsw_core_flush_owq();
|
2016-11-14 18:26:32 +08:00
|
|
|
mlxsw_sp_router_fib_flush(mlxsw_sp);
|
2017-05-17 01:38:25 +08:00
|
|
|
kfree(mlxsw_sp->router->vrs);
|
2016-07-04 14:23:09 +08:00
|
|
|
}
|
|
|
|
|
2017-09-03 05:49:19 +08:00
|
|
|
static struct net_device *
|
|
|
|
__mlxsw_sp_ipip_netdev_ul_dev_get(const struct net_device *ol_dev)
|
|
|
|
{
|
|
|
|
struct ip_tunnel *tun = netdev_priv(ol_dev);
|
|
|
|
struct net *net = dev_net(ol_dev);
|
|
|
|
|
2020-02-20 15:07:55 +08:00
|
|
|
return dev_get_by_index_rcu(net, tun->parms.link);
|
2017-09-03 05:49:19 +08:00
|
|
|
}
|
|
|
|
|
2017-11-03 17:03:42 +08:00
|
|
|
u32 mlxsw_sp_ipip_dev_ul_tb_id(const struct net_device *ol_dev)
|
2017-09-03 05:49:19 +08:00
|
|
|
{
|
2020-02-20 15:07:55 +08:00
|
|
|
struct net_device *d;
|
|
|
|
u32 tb_id;
|
2017-09-03 05:49:19 +08:00
|
|
|
|
2020-02-20 15:07:55 +08:00
|
|
|
rcu_read_lock();
|
|
|
|
d = __mlxsw_sp_ipip_netdev_ul_dev_get(ol_dev);
|
2017-09-03 05:49:19 +08:00
|
|
|
if (d)
|
2020-02-20 15:07:55 +08:00
|
|
|
tb_id = l3mdev_fib_table(d) ? : RT_TABLE_MAIN;
|
2017-09-03 05:49:19 +08:00
|
|
|
else
|
2020-02-20 15:07:55 +08:00
|
|
|
tb_id = RT_TABLE_MAIN;
|
|
|
|
rcu_read_unlock();
|
|
|
|
|
|
|
|
return tb_id;
|
2017-09-03 05:49:19 +08:00
|
|
|
}
|
|
|
|
|
2017-09-03 05:49:23 +08:00
|
|
|
static struct mlxsw_sp_rif *
|
|
|
|
mlxsw_sp_rif_create(struct mlxsw_sp *mlxsw_sp,
|
2017-10-19 00:56:56 +08:00
|
|
|
const struct mlxsw_sp_rif_params *params,
|
|
|
|
struct netlink_ext_ack *extack);
|
2017-09-03 05:49:23 +08:00
|
|
|
|
|
|
|
static struct mlxsw_sp_rif_ipip_lb *
|
|
|
|
mlxsw_sp_ipip_ol_ipip_lb_create(struct mlxsw_sp *mlxsw_sp,
|
|
|
|
enum mlxsw_sp_ipip_type ipipt,
|
2017-11-03 17:03:36 +08:00
|
|
|
struct net_device *ol_dev,
|
|
|
|
struct netlink_ext_ack *extack)
|
2017-09-03 05:49:23 +08:00
|
|
|
{
|
|
|
|
struct mlxsw_sp_rif_params_ipip_lb lb_params;
|
|
|
|
const struct mlxsw_sp_ipip_ops *ipip_ops;
|
|
|
|
struct mlxsw_sp_rif *rif;
|
|
|
|
|
|
|
|
ipip_ops = mlxsw_sp->router->ipip_ops_arr[ipipt];
|
|
|
|
lb_params = (struct mlxsw_sp_rif_params_ipip_lb) {
|
|
|
|
.common.dev = ol_dev,
|
|
|
|
.common.lag = false,
|
|
|
|
.lb_config = ipip_ops->ol_loopback_config(mlxsw_sp, ol_dev),
|
|
|
|
};
|
|
|
|
|
2017-11-03 17:03:36 +08:00
|
|
|
rif = mlxsw_sp_rif_create(mlxsw_sp, &lb_params.common, extack);
|
2017-09-03 05:49:23 +08:00
|
|
|
if (IS_ERR(rif))
|
|
|
|
return ERR_CAST(rif);
|
|
|
|
return container_of(rif, struct mlxsw_sp_rif_ipip_lb, common);
|
|
|
|
}
|
|
|
|
|
|
|
|
static struct mlxsw_sp_ipip_entry *
|
|
|
|
mlxsw_sp_ipip_entry_alloc(struct mlxsw_sp *mlxsw_sp,
|
|
|
|
enum mlxsw_sp_ipip_type ipipt,
|
|
|
|
struct net_device *ol_dev)
|
|
|
|
{
|
2018-02-13 18:26:09 +08:00
|
|
|
const struct mlxsw_sp_ipip_ops *ipip_ops;
|
2017-09-03 05:49:23 +08:00
|
|
|
struct mlxsw_sp_ipip_entry *ipip_entry;
|
|
|
|
struct mlxsw_sp_ipip_entry *ret = NULL;
|
|
|
|
|
2018-02-13 18:26:09 +08:00
|
|
|
ipip_ops = mlxsw_sp->router->ipip_ops_arr[ipipt];
|
2017-09-03 05:49:23 +08:00
|
|
|
ipip_entry = kzalloc(sizeof(*ipip_entry), GFP_KERNEL);
|
|
|
|
if (!ipip_entry)
|
|
|
|
return ERR_PTR(-ENOMEM);
|
|
|
|
|
|
|
|
ipip_entry->ol_lb = mlxsw_sp_ipip_ol_ipip_lb_create(mlxsw_sp, ipipt,
|
2017-11-03 17:03:36 +08:00
|
|
|
ol_dev, NULL);
|
2017-09-03 05:49:23 +08:00
|
|
|
if (IS_ERR(ipip_entry->ol_lb)) {
|
|
|
|
ret = ERR_CAST(ipip_entry->ol_lb);
|
|
|
|
goto err_ol_ipip_lb_create;
|
|
|
|
}
|
|
|
|
|
|
|
|
ipip_entry->ipipt = ipipt;
|
|
|
|
ipip_entry->ol_dev = ol_dev;
|
2018-02-13 18:26:09 +08:00
|
|
|
|
|
|
|
switch (ipip_ops->ul_proto) {
|
|
|
|
case MLXSW_SP_L3_PROTO_IPV4:
|
|
|
|
ipip_entry->parms4 = mlxsw_sp_ipip_netdev_parms4(ol_dev);
|
|
|
|
break;
|
|
|
|
case MLXSW_SP_L3_PROTO_IPV6:
|
|
|
|
WARN_ON(1);
|
|
|
|
break;
|
|
|
|
}
|
2017-09-03 05:49:23 +08:00
|
|
|
|
|
|
|
return ipip_entry;
|
|
|
|
|
|
|
|
err_ol_ipip_lb_create:
|
|
|
|
kfree(ipip_entry);
|
|
|
|
return ret;
|
|
|
|
}
|
|
|
|
|
|
|
|
static void
|
2017-10-16 22:26:39 +08:00
|
|
|
mlxsw_sp_ipip_entry_dealloc(struct mlxsw_sp_ipip_entry *ipip_entry)
|
2017-09-03 05:49:23 +08:00
|
|
|
{
|
|
|
|
mlxsw_sp_rif_destroy(&ipip_entry->ol_lb->common);
|
|
|
|
kfree(ipip_entry);
|
|
|
|
}
|
|
|
|
|
|
|
|
static bool
|
|
|
|
mlxsw_sp_ipip_entry_saddr_matches(struct mlxsw_sp *mlxsw_sp,
|
|
|
|
const enum mlxsw_sp_l3proto ul_proto,
|
|
|
|
union mlxsw_sp_l3addr saddr,
|
|
|
|
u32 ul_tb_id,
|
|
|
|
struct mlxsw_sp_ipip_entry *ipip_entry)
|
|
|
|
{
|
|
|
|
u32 tun_ul_tb_id = mlxsw_sp_ipip_dev_ul_tb_id(ipip_entry->ol_dev);
|
|
|
|
enum mlxsw_sp_ipip_type ipipt = ipip_entry->ipipt;
|
|
|
|
union mlxsw_sp_l3addr tun_saddr;
|
|
|
|
|
|
|
|
if (mlxsw_sp->router->ipip_ops_arr[ipipt]->ul_proto != ul_proto)
|
|
|
|
return false;
|
|
|
|
|
|
|
|
tun_saddr = mlxsw_sp_ipip_netdev_saddr(ul_proto, ipip_entry->ol_dev);
|
|
|
|
return tun_ul_tb_id == ul_tb_id &&
|
|
|
|
mlxsw_sp_l3addr_eq(&tun_saddr, &saddr);
|
|
|
|
}
|
|
|
|
|
2017-09-03 05:49:25 +08:00
|
|
|
static int
|
|
|
|
mlxsw_sp_fib_entry_decap_init(struct mlxsw_sp *mlxsw_sp,
|
|
|
|
struct mlxsw_sp_fib_entry *fib_entry,
|
|
|
|
struct mlxsw_sp_ipip_entry *ipip_entry)
|
|
|
|
{
|
|
|
|
u32 tunnel_index;
|
|
|
|
int err;
|
|
|
|
|
2018-07-09 04:51:17 +08:00
|
|
|
err = mlxsw_sp_kvdl_alloc(mlxsw_sp, MLXSW_SP_KVDL_ENTRY_TYPE_ADJ,
|
|
|
|
1, &tunnel_index);
|
2017-09-03 05:49:25 +08:00
|
|
|
if (err)
|
|
|
|
return err;
|
|
|
|
|
|
|
|
ipip_entry->decap_fib_entry = fib_entry;
|
|
|
|
fib_entry->decap.ipip_entry = ipip_entry;
|
|
|
|
fib_entry->decap.tunnel_index = tunnel_index;
|
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
|
|
|
static void mlxsw_sp_fib_entry_decap_fini(struct mlxsw_sp *mlxsw_sp,
|
|
|
|
struct mlxsw_sp_fib_entry *fib_entry)
|
|
|
|
{
|
|
|
|
/* Unlink this node from the IPIP entry that it's the decap entry of. */
|
|
|
|
fib_entry->decap.ipip_entry->decap_fib_entry = NULL;
|
|
|
|
fib_entry->decap.ipip_entry = NULL;
|
2018-07-09 04:51:17 +08:00
|
|
|
mlxsw_sp_kvdl_free(mlxsw_sp, MLXSW_SP_KVDL_ENTRY_TYPE_ADJ,
|
2018-07-09 04:51:18 +08:00
|
|
|
1, fib_entry->decap.tunnel_index);
|
2017-09-03 05:49:25 +08:00
|
|
|
}
|
|
|
|
|
2017-09-03 05:49:26 +08:00
|
|
|
static struct mlxsw_sp_fib_node *
|
|
|
|
mlxsw_sp_fib_node_lookup(struct mlxsw_sp_fib *fib, const void *addr,
|
|
|
|
size_t addr_len, unsigned char prefix_len);
|
2017-09-03 05:49:25 +08:00
|
|
|
static int mlxsw_sp_fib_entry_update(struct mlxsw_sp *mlxsw_sp,
|
|
|
|
struct mlxsw_sp_fib_entry *fib_entry);
|
|
|
|
|
|
|
|
static void
|
|
|
|
mlxsw_sp_ipip_entry_demote_decap(struct mlxsw_sp *mlxsw_sp,
|
|
|
|
struct mlxsw_sp_ipip_entry *ipip_entry)
|
|
|
|
{
|
|
|
|
struct mlxsw_sp_fib_entry *fib_entry = ipip_entry->decap_fib_entry;
|
|
|
|
|
|
|
|
mlxsw_sp_fib_entry_decap_fini(mlxsw_sp, fib_entry);
|
|
|
|
fib_entry->type = MLXSW_SP_FIB_ENTRY_TYPE_TRAP;
|
|
|
|
|
|
|
|
mlxsw_sp_fib_entry_update(mlxsw_sp, fib_entry);
|
|
|
|
}
|
|
|
|
|
2017-09-03 05:49:26 +08:00
|
|
|
static void
|
|
|
|
mlxsw_sp_ipip_entry_promote_decap(struct mlxsw_sp *mlxsw_sp,
|
|
|
|
struct mlxsw_sp_ipip_entry *ipip_entry,
|
|
|
|
struct mlxsw_sp_fib_entry *decap_fib_entry)
|
|
|
|
{
|
|
|
|
if (mlxsw_sp_fib_entry_decap_init(mlxsw_sp, decap_fib_entry,
|
|
|
|
ipip_entry))
|
|
|
|
return;
|
|
|
|
decap_fib_entry->type = MLXSW_SP_FIB_ENTRY_TYPE_IPIP_DECAP;
|
|
|
|
|
|
|
|
if (mlxsw_sp_fib_entry_update(mlxsw_sp, decap_fib_entry))
|
|
|
|
mlxsw_sp_ipip_entry_demote_decap(mlxsw_sp, ipip_entry);
|
|
|
|
}
|
|
|
|
|
2018-10-17 16:53:07 +08:00
|
|
|
static struct mlxsw_sp_fib_entry *
|
|
|
|
mlxsw_sp_router_ip2me_fib_entry_find(struct mlxsw_sp *mlxsw_sp, u32 tb_id,
|
|
|
|
enum mlxsw_sp_l3proto proto,
|
|
|
|
const union mlxsw_sp_l3addr *addr,
|
|
|
|
enum mlxsw_sp_fib_entry_type type)
|
|
|
|
{
|
|
|
|
struct mlxsw_sp_fib_node *fib_node;
|
|
|
|
unsigned char addr_prefix_len;
|
|
|
|
struct mlxsw_sp_fib *fib;
|
|
|
|
struct mlxsw_sp_vr *vr;
|
|
|
|
const void *addrp;
|
|
|
|
size_t addr_len;
|
|
|
|
u32 addr4;
|
|
|
|
|
|
|
|
vr = mlxsw_sp_vr_find(mlxsw_sp, tb_id);
|
|
|
|
if (!vr)
|
|
|
|
return NULL;
|
|
|
|
fib = mlxsw_sp_vr_fib(vr, proto);
|
|
|
|
|
|
|
|
switch (proto) {
|
|
|
|
case MLXSW_SP_L3_PROTO_IPV4:
|
|
|
|
addr4 = be32_to_cpu(addr->addr4);
|
|
|
|
addrp = &addr4;
|
|
|
|
addr_len = 4;
|
|
|
|
addr_prefix_len = 32;
|
|
|
|
break;
|
|
|
|
case MLXSW_SP_L3_PROTO_IPV6: /* fall through */
|
|
|
|
default:
|
|
|
|
WARN_ON(1);
|
|
|
|
return NULL;
|
|
|
|
}
|
|
|
|
|
|
|
|
fib_node = mlxsw_sp_fib_node_lookup(fib, addrp, addr_len,
|
|
|
|
addr_prefix_len);
|
2019-12-27 00:41:17 +08:00
|
|
|
if (!fib_node || fib_node->fib_entry->type != type)
|
2018-10-17 16:53:07 +08:00
|
|
|
return NULL;
|
|
|
|
|
2019-12-27 00:41:17 +08:00
|
|
|
return fib_node->fib_entry;
|
2018-10-17 16:53:07 +08:00
|
|
|
}
|
|
|
|
|
2017-09-03 05:49:26 +08:00
|
|
|
/* Given an IPIP entry, find the corresponding decap route. */
|
|
|
|
static struct mlxsw_sp_fib_entry *
|
|
|
|
mlxsw_sp_ipip_entry_find_decap(struct mlxsw_sp *mlxsw_sp,
|
|
|
|
struct mlxsw_sp_ipip_entry *ipip_entry)
|
|
|
|
{
|
|
|
|
static struct mlxsw_sp_fib_node *fib_node;
|
|
|
|
const struct mlxsw_sp_ipip_ops *ipip_ops;
|
|
|
|
unsigned char saddr_prefix_len;
|
|
|
|
union mlxsw_sp_l3addr saddr;
|
|
|
|
struct mlxsw_sp_fib *ul_fib;
|
|
|
|
struct mlxsw_sp_vr *ul_vr;
|
|
|
|
const void *saddrp;
|
|
|
|
size_t saddr_len;
|
|
|
|
u32 ul_tb_id;
|
|
|
|
u32 saddr4;
|
|
|
|
|
|
|
|
ipip_ops = mlxsw_sp->router->ipip_ops_arr[ipip_entry->ipipt];
|
|
|
|
|
|
|
|
ul_tb_id = mlxsw_sp_ipip_dev_ul_tb_id(ipip_entry->ol_dev);
|
|
|
|
ul_vr = mlxsw_sp_vr_find(mlxsw_sp, ul_tb_id);
|
|
|
|
if (!ul_vr)
|
|
|
|
return NULL;
|
|
|
|
|
|
|
|
ul_fib = mlxsw_sp_vr_fib(ul_vr, ipip_ops->ul_proto);
|
|
|
|
saddr = mlxsw_sp_ipip_netdev_saddr(ipip_ops->ul_proto,
|
|
|
|
ipip_entry->ol_dev);
|
|
|
|
|
|
|
|
switch (ipip_ops->ul_proto) {
|
|
|
|
case MLXSW_SP_L3_PROTO_IPV4:
|
|
|
|
saddr4 = be32_to_cpu(saddr.addr4);
|
|
|
|
saddrp = &saddr4;
|
|
|
|
saddr_len = 4;
|
|
|
|
saddr_prefix_len = 32;
|
|
|
|
break;
|
|
|
|
case MLXSW_SP_L3_PROTO_IPV6:
|
|
|
|
WARN_ON(1);
|
|
|
|
return NULL;
|
|
|
|
}
|
|
|
|
|
|
|
|
fib_node = mlxsw_sp_fib_node_lookup(ul_fib, saddrp, saddr_len,
|
|
|
|
saddr_prefix_len);
|
2019-12-27 00:41:17 +08:00
|
|
|
if (!fib_node ||
|
|
|
|
fib_node->fib_entry->type != MLXSW_SP_FIB_ENTRY_TYPE_TRAP)
|
2017-09-03 05:49:26 +08:00
|
|
|
return NULL;
|
|
|
|
|
2019-12-27 00:41:17 +08:00
|
|
|
return fib_node->fib_entry;
|
2017-09-03 05:49:26 +08:00
|
|
|
}
|
|
|
|
|
2017-09-03 05:49:23 +08:00
|
|
|
static struct mlxsw_sp_ipip_entry *
|
2017-10-16 22:26:39 +08:00
|
|
|
mlxsw_sp_ipip_entry_create(struct mlxsw_sp *mlxsw_sp,
|
|
|
|
enum mlxsw_sp_ipip_type ipipt,
|
|
|
|
struct net_device *ol_dev)
|
2017-09-03 05:49:23 +08:00
|
|
|
{
|
|
|
|
struct mlxsw_sp_ipip_entry *ipip_entry;
|
|
|
|
|
|
|
|
ipip_entry = mlxsw_sp_ipip_entry_alloc(mlxsw_sp, ipipt, ol_dev);
|
|
|
|
if (IS_ERR(ipip_entry))
|
|
|
|
return ipip_entry;
|
|
|
|
|
|
|
|
list_add_tail(&ipip_entry->ipip_list_node,
|
|
|
|
&mlxsw_sp->router->ipip_list);
|
|
|
|
|
|
|
|
return ipip_entry;
|
|
|
|
}
|
|
|
|
|
|
|
|
static void
|
2017-10-16 22:26:39 +08:00
|
|
|
mlxsw_sp_ipip_entry_destroy(struct mlxsw_sp *mlxsw_sp,
|
|
|
|
struct mlxsw_sp_ipip_entry *ipip_entry)
|
2017-09-03 05:49:23 +08:00
|
|
|
{
|
2017-10-16 22:26:39 +08:00
|
|
|
list_del(&ipip_entry->ipip_list_node);
|
|
|
|
mlxsw_sp_ipip_entry_dealloc(ipip_entry);
|
2017-09-03 05:49:23 +08:00
|
|
|
}
|
|
|
|
|
2017-09-03 05:49:25 +08:00
|
|
|
static bool
|
|
|
|
mlxsw_sp_ipip_entry_matches_decap(struct mlxsw_sp *mlxsw_sp,
|
|
|
|
const struct net_device *ul_dev,
|
|
|
|
enum mlxsw_sp_l3proto ul_proto,
|
|
|
|
union mlxsw_sp_l3addr ul_dip,
|
|
|
|
struct mlxsw_sp_ipip_entry *ipip_entry)
|
|
|
|
{
|
|
|
|
u32 ul_tb_id = l3mdev_fib_table(ul_dev) ? : RT_TABLE_MAIN;
|
|
|
|
enum mlxsw_sp_ipip_type ipipt = ipip_entry->ipipt;
|
|
|
|
|
|
|
|
if (mlxsw_sp->router->ipip_ops_arr[ipipt]->ul_proto != ul_proto)
|
|
|
|
return false;
|
|
|
|
|
|
|
|
return mlxsw_sp_ipip_entry_saddr_matches(mlxsw_sp, ul_proto, ul_dip,
|
2018-12-07 01:44:52 +08:00
|
|
|
ul_tb_id, ipip_entry);
|
2017-09-03 05:49:25 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
/* Given decap parameters, find the corresponding IPIP entry. */
|
|
|
|
static struct mlxsw_sp_ipip_entry *
|
|
|
|
mlxsw_sp_ipip_entry_find_by_decap(struct mlxsw_sp *mlxsw_sp,
|
|
|
|
const struct net_device *ul_dev,
|
|
|
|
enum mlxsw_sp_l3proto ul_proto,
|
|
|
|
union mlxsw_sp_l3addr ul_dip)
|
|
|
|
{
|
|
|
|
struct mlxsw_sp_ipip_entry *ipip_entry;
|
|
|
|
|
|
|
|
list_for_each_entry(ipip_entry, &mlxsw_sp->router->ipip_list,
|
|
|
|
ipip_list_node)
|
|
|
|
if (mlxsw_sp_ipip_entry_matches_decap(mlxsw_sp, ul_dev,
|
|
|
|
ul_proto, ul_dip,
|
|
|
|
ipip_entry))
|
|
|
|
return ipip_entry;
|
|
|
|
|
|
|
|
return NULL;
|
|
|
|
}
|
|
|
|
|
2017-10-16 22:26:36 +08:00
|
|
|
static bool mlxsw_sp_netdev_ipip_type(const struct mlxsw_sp *mlxsw_sp,
|
|
|
|
const struct net_device *dev,
|
|
|
|
enum mlxsw_sp_ipip_type *p_type)
|
|
|
|
{
|
|
|
|
struct mlxsw_sp_router *router = mlxsw_sp->router;
|
|
|
|
const struct mlxsw_sp_ipip_ops *ipip_ops;
|
|
|
|
enum mlxsw_sp_ipip_type ipipt;
|
|
|
|
|
|
|
|
for (ipipt = 0; ipipt < MLXSW_SP_IPIP_TYPE_MAX; ++ipipt) {
|
|
|
|
ipip_ops = router->ipip_ops_arr[ipipt];
|
|
|
|
if (dev->type == ipip_ops->dev_type) {
|
|
|
|
if (p_type)
|
|
|
|
*p_type = ipipt;
|
|
|
|
return true;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
return false;
|
|
|
|
}
|
|
|
|
|
2017-11-03 17:03:29 +08:00
|
|
|
bool mlxsw_sp_netdev_is_ipip_ol(const struct mlxsw_sp *mlxsw_sp,
|
|
|
|
const struct net_device *dev)
|
2017-10-16 22:26:37 +08:00
|
|
|
{
|
|
|
|
return mlxsw_sp_netdev_ipip_type(mlxsw_sp, dev, NULL);
|
|
|
|
}
|
|
|
|
|
|
|
|
static struct mlxsw_sp_ipip_entry *
|
|
|
|
mlxsw_sp_ipip_entry_find_by_ol_dev(struct mlxsw_sp *mlxsw_sp,
|
|
|
|
const struct net_device *ol_dev)
|
|
|
|
{
|
|
|
|
struct mlxsw_sp_ipip_entry *ipip_entry;
|
|
|
|
|
|
|
|
list_for_each_entry(ipip_entry, &mlxsw_sp->router->ipip_list,
|
|
|
|
ipip_list_node)
|
|
|
|
if (ipip_entry->ol_dev == ol_dev)
|
|
|
|
return ipip_entry;
|
|
|
|
|
|
|
|
return NULL;
|
|
|
|
}
|
|
|
|
|
2017-11-03 17:03:41 +08:00
|
|
|
static struct mlxsw_sp_ipip_entry *
|
|
|
|
mlxsw_sp_ipip_entry_find_by_ul_dev(const struct mlxsw_sp *mlxsw_sp,
|
|
|
|
const struct net_device *ul_dev,
|
|
|
|
struct mlxsw_sp_ipip_entry *start)
|
|
|
|
{
|
|
|
|
struct mlxsw_sp_ipip_entry *ipip_entry;
|
|
|
|
|
|
|
|
ipip_entry = list_prepare_entry(start, &mlxsw_sp->router->ipip_list,
|
|
|
|
ipip_list_node);
|
|
|
|
list_for_each_entry_continue(ipip_entry, &mlxsw_sp->router->ipip_list,
|
|
|
|
ipip_list_node) {
|
2020-02-20 15:07:55 +08:00
|
|
|
struct net_device *ol_dev = ipip_entry->ol_dev;
|
|
|
|
struct net_device *ipip_ul_dev;
|
|
|
|
|
|
|
|
rcu_read_lock();
|
|
|
|
ipip_ul_dev = __mlxsw_sp_ipip_netdev_ul_dev_get(ol_dev);
|
|
|
|
rcu_read_unlock();
|
2017-11-03 17:03:41 +08:00
|
|
|
|
|
|
|
if (ipip_ul_dev == ul_dev)
|
|
|
|
return ipip_entry;
|
|
|
|
}
|
|
|
|
|
|
|
|
return NULL;
|
|
|
|
}
|
|
|
|
|
2020-02-22 01:54:12 +08:00
|
|
|
bool mlxsw_sp_netdev_is_ipip_ul(struct mlxsw_sp *mlxsw_sp,
|
2017-11-03 17:03:41 +08:00
|
|
|
const struct net_device *dev)
|
|
|
|
{
|
2020-02-22 01:54:12 +08:00
|
|
|
bool is_ipip_ul;
|
|
|
|
|
|
|
|
mutex_lock(&mlxsw_sp->router->lock);
|
|
|
|
is_ipip_ul = mlxsw_sp_ipip_entry_find_by_ul_dev(mlxsw_sp, dev, NULL);
|
|
|
|
mutex_unlock(&mlxsw_sp->router->lock);
|
|
|
|
|
|
|
|
return is_ipip_ul;
|
2017-11-03 17:03:41 +08:00
|
|
|
}
|
|
|
|
|
2017-11-03 17:03:30 +08:00
|
|
|
static bool mlxsw_sp_netdevice_ipip_can_offload(struct mlxsw_sp *mlxsw_sp,
|
|
|
|
const struct net_device *ol_dev,
|
|
|
|
enum mlxsw_sp_ipip_type ipipt)
|
|
|
|
{
|
|
|
|
const struct mlxsw_sp_ipip_ops *ops
|
|
|
|
= mlxsw_sp->router->ipip_ops_arr[ipipt];
|
|
|
|
|
|
|
|
/* For deciding whether decap should be offloaded, we don't care about
|
|
|
|
* overlay protocol, so ask whether either one is supported.
|
|
|
|
*/
|
|
|
|
return ops->can_offload(mlxsw_sp, ol_dev, MLXSW_SP_L3_PROTO_IPV4) ||
|
|
|
|
ops->can_offload(mlxsw_sp, ol_dev, MLXSW_SP_L3_PROTO_IPV6);
|
|
|
|
}
|
|
|
|
|
2017-11-03 17:03:29 +08:00
|
|
|
static int mlxsw_sp_netdevice_ipip_ol_reg_event(struct mlxsw_sp *mlxsw_sp,
|
|
|
|
struct net_device *ol_dev)
|
2017-10-16 22:26:37 +08:00
|
|
|
{
|
|
|
|
struct mlxsw_sp_ipip_entry *ipip_entry;
|
mlxsw: spectrum_router: Onload conflicting tunnels
The approach for offloading IP tunnels implemented currently by mlxsw
doesn't allow two tunnels that have the same local IP address in the
same (underlay) VRF. Previously, offloads were introduced on demand as
encap routes were formed. When such a route was created that would cause
offload of a conflicting tunnel, mlxsw_sp_ipip_entry_create() would
detect it and return -EEXIST, which would propagate up and cause FIB
abort.
Now however IPIP entries are created as soon as an offloadable netdevice
is created, and the failure prevents creation of such device.
Furthermore, if the driver is installed at the point where such
conflicting tunnels exist, the failure actually prevents successful
modprobe.
Furthermore, follow-up patches implement handling of NETDEV_CHANGE due
to the local address change. However, NETDEV_CHANGE can't be vetoed. The
failure merely means that the offloads weren't updated, but the change
in Linux configuration is not rolled back. It is thus desirable to have
a robust way of handling these conflicts, which can later be reused for
handling NETDEV_CHANGE as well.
To fix this, when a conflicting tunnel is created, instead of failing,
simply pull the old tunnel to slow path and reject offloading the
new one.
Introduce two functions: mlxsw_sp_ipip_entry_demote_tunnel() and
mlxsw_sp_ipip_demote_tunnel_by_saddr() to handle this. Make them both
public, because they will be useful later on in this patchset.
Signed-off-by: Petr Machata <petrm@mellanox.com>
Reviewed-by: Ido Schimmel <idosch@mellanox.com>
Signed-off-by: Jiri Pirko <jiri@mellanox.com>
Signed-off-by: David S. Miller <davem@davemloft.net>
2017-11-03 17:03:40 +08:00
|
|
|
enum mlxsw_sp_l3proto ul_proto;
|
2017-10-16 22:26:37 +08:00
|
|
|
enum mlxsw_sp_ipip_type ipipt;
|
mlxsw: spectrum_router: Onload conflicting tunnels
The approach for offloading IP tunnels implemented currently by mlxsw
doesn't allow two tunnels that have the same local IP address in the
same (underlay) VRF. Previously, offloads were introduced on demand as
encap routes were formed. When such a route was created that would cause
offload of a conflicting tunnel, mlxsw_sp_ipip_entry_create() would
detect it and return -EEXIST, which would propagate up and cause FIB
abort.
Now however IPIP entries are created as soon as an offloadable netdevice
is created, and the failure prevents creation of such device.
Furthermore, if the driver is installed at the point where such
conflicting tunnels exist, the failure actually prevents successful
modprobe.
Furthermore, follow-up patches implement handling of NETDEV_CHANGE due
to the local address change. However, NETDEV_CHANGE can't be vetoed. The
failure merely means that the offloads weren't updated, but the change
in Linux configuration is not rolled back. It is thus desirable to have
a robust way of handling these conflicts, which can later be reused for
handling NETDEV_CHANGE as well.
To fix this, when a conflicting tunnel is created, instead of failing,
simply pull the old tunnel to slow path and reject offloading the
new one.
Introduce two functions: mlxsw_sp_ipip_entry_demote_tunnel() and
mlxsw_sp_ipip_demote_tunnel_by_saddr() to handle this. Make them both
public, because they will be useful later on in this patchset.
Signed-off-by: Petr Machata <petrm@mellanox.com>
Reviewed-by: Ido Schimmel <idosch@mellanox.com>
Signed-off-by: Jiri Pirko <jiri@mellanox.com>
Signed-off-by: David S. Miller <davem@davemloft.net>
2017-11-03 17:03:40 +08:00
|
|
|
union mlxsw_sp_l3addr saddr;
|
|
|
|
u32 ul_tb_id;
|
2017-10-16 22:26:37 +08:00
|
|
|
|
|
|
|
mlxsw_sp_netdev_ipip_type(mlxsw_sp, ol_dev, &ipipt);
|
2017-11-03 17:03:30 +08:00
|
|
|
if (mlxsw_sp_netdevice_ipip_can_offload(mlxsw_sp, ol_dev, ipipt)) {
|
mlxsw: spectrum_router: Onload conflicting tunnels
The approach for offloading IP tunnels implemented currently by mlxsw
doesn't allow two tunnels that have the same local IP address in the
same (underlay) VRF. Previously, offloads were introduced on demand as
encap routes were formed. When such a route was created that would cause
offload of a conflicting tunnel, mlxsw_sp_ipip_entry_create() would
detect it and return -EEXIST, which would propagate up and cause FIB
abort.
Now however IPIP entries are created as soon as an offloadable netdevice
is created, and the failure prevents creation of such device.
Furthermore, if the driver is installed at the point where such
conflicting tunnels exist, the failure actually prevents successful
modprobe.
Furthermore, follow-up patches implement handling of NETDEV_CHANGE due
to the local address change. However, NETDEV_CHANGE can't be vetoed. The
failure merely means that the offloads weren't updated, but the change
in Linux configuration is not rolled back. It is thus desirable to have
a robust way of handling these conflicts, which can later be reused for
handling NETDEV_CHANGE as well.
To fix this, when a conflicting tunnel is created, instead of failing,
simply pull the old tunnel to slow path and reject offloading the
new one.
Introduce two functions: mlxsw_sp_ipip_entry_demote_tunnel() and
mlxsw_sp_ipip_demote_tunnel_by_saddr() to handle this. Make them both
public, because they will be useful later on in this patchset.
Signed-off-by: Petr Machata <petrm@mellanox.com>
Reviewed-by: Ido Schimmel <idosch@mellanox.com>
Signed-off-by: Jiri Pirko <jiri@mellanox.com>
Signed-off-by: David S. Miller <davem@davemloft.net>
2017-11-03 17:03:40 +08:00
|
|
|
ul_tb_id = mlxsw_sp_ipip_dev_ul_tb_id(ol_dev);
|
|
|
|
ul_proto = mlxsw_sp->router->ipip_ops_arr[ipipt]->ul_proto;
|
|
|
|
saddr = mlxsw_sp_ipip_netdev_saddr(ul_proto, ol_dev);
|
|
|
|
if (!mlxsw_sp_ipip_demote_tunnel_by_saddr(mlxsw_sp, ul_proto,
|
|
|
|
saddr, ul_tb_id,
|
|
|
|
NULL)) {
|
|
|
|
ipip_entry = mlxsw_sp_ipip_entry_create(mlxsw_sp, ipipt,
|
|
|
|
ol_dev);
|
|
|
|
if (IS_ERR(ipip_entry))
|
|
|
|
return PTR_ERR(ipip_entry);
|
|
|
|
}
|
2017-10-16 22:26:37 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
2017-11-03 17:03:29 +08:00
|
|
|
/* Handle unregistration of the overlay device @ol_dev: destroy its IPIP
 * entry, if it has one.
 */
static void mlxsw_sp_netdevice_ipip_ol_unreg_event(struct mlxsw_sp *mlxsw_sp,
						   struct net_device *ol_dev)
{
	struct mlxsw_sp_ipip_entry *tunnel;

	tunnel = mlxsw_sp_ipip_entry_find_by_ol_dev(mlxsw_sp, ol_dev);
	if (!tunnel)
		return;

	mlxsw_sp_ipip_entry_destroy(mlxsw_sp, tunnel);
}
|
|
|
|
|
2017-11-03 17:03:35 +08:00
|
|
|
/* The overlay device of @ipip_entry is up: if a matching decap route exists,
 * promote it to an IPIP decap route.
 */
static void
mlxsw_sp_ipip_entry_ol_up_event(struct mlxsw_sp *mlxsw_sp,
				struct mlxsw_sp_ipip_entry *ipip_entry)
{
	struct mlxsw_sp_fib_entry *decap_route;

	decap_route = mlxsw_sp_ipip_entry_find_decap(mlxsw_sp, ipip_entry);
	if (!decap_route)
		return;

	mlxsw_sp_ipip_entry_promote_decap(mlxsw_sp, ipip_entry, decap_route);
}
|
|
|
|
|
2018-03-23 01:53:34 +08:00
|
|
|
static int
|
2019-01-20 14:50:42 +08:00
|
|
|
mlxsw_sp_rif_ipip_lb_op(struct mlxsw_sp_rif_ipip_lb *lb_rif, u16 ul_vr_id,
|
|
|
|
u16 ul_rif_id, bool enable)
|
2018-03-23 01:53:34 +08:00
|
|
|
{
|
|
|
|
struct mlxsw_sp_rif_ipip_lb_config lb_cf = lb_rif->lb_config;
|
|
|
|
struct mlxsw_sp_rif *rif = &lb_rif->common;
|
|
|
|
struct mlxsw_sp *mlxsw_sp = rif->mlxsw_sp;
|
|
|
|
char ritr_pl[MLXSW_REG_RITR_LEN];
|
|
|
|
u32 saddr4;
|
|
|
|
|
|
|
|
switch (lb_cf.ul_protocol) {
|
|
|
|
case MLXSW_SP_L3_PROTO_IPV4:
|
|
|
|
saddr4 = be32_to_cpu(lb_cf.saddr.addr4);
|
|
|
|
mlxsw_reg_ritr_pack(ritr_pl, enable, MLXSW_REG_RITR_LOOPBACK_IF,
|
|
|
|
rif->rif_index, rif->vr_id, rif->dev->mtu);
|
|
|
|
mlxsw_reg_ritr_loopback_ipip4_pack(ritr_pl, lb_cf.lb_ipipt,
|
|
|
|
MLXSW_REG_RITR_LOOPBACK_IPIP_OPTIONS_GRE_KEY_PRESET,
|
2019-01-20 14:50:42 +08:00
|
|
|
ul_vr_id, ul_rif_id, saddr4, lb_cf.okey);
|
2018-03-23 01:53:34 +08:00
|
|
|
break;
|
|
|
|
|
|
|
|
case MLXSW_SP_L3_PROTO_IPV6:
|
|
|
|
return -EAFNOSUPPORT;
|
|
|
|
}
|
|
|
|
|
|
|
|
return mlxsw_reg_write(mlxsw_sp->core, MLXSW_REG(ritr), ritr_pl);
|
|
|
|
}
|
|
|
|
|
2018-03-23 01:53:35 +08:00
|
|
|
static int mlxsw_sp_netdevice_ipip_ol_update_mtu(struct mlxsw_sp *mlxsw_sp,
|
|
|
|
struct net_device *ol_dev)
|
|
|
|
{
|
|
|
|
struct mlxsw_sp_ipip_entry *ipip_entry;
|
|
|
|
struct mlxsw_sp_rif_ipip_lb *lb_rif;
|
|
|
|
int err = 0;
|
|
|
|
|
|
|
|
ipip_entry = mlxsw_sp_ipip_entry_find_by_ol_dev(mlxsw_sp, ol_dev);
|
|
|
|
if (ipip_entry) {
|
|
|
|
lb_rif = ipip_entry->ol_lb;
|
2019-01-20 14:50:47 +08:00
|
|
|
err = mlxsw_sp_rif_ipip_lb_op(lb_rif, lb_rif->ul_vr_id,
|
|
|
|
lb_rif->ul_rif_id, true);
|
2018-03-23 01:53:35 +08:00
|
|
|
if (err)
|
|
|
|
goto out;
|
|
|
|
lb_rif->common.mtu = ol_dev->mtu;
|
|
|
|
}
|
|
|
|
|
|
|
|
out:
|
|
|
|
return err;
|
|
|
|
}
|
|
|
|
|
2017-11-03 17:03:34 +08:00
|
|
|
/* Handle the overlay device @ol_dev going up: forward the event to its IPIP
 * entry, if it has one.
 */
static void mlxsw_sp_netdevice_ipip_ol_up_event(struct mlxsw_sp *mlxsw_sp,
						struct net_device *ol_dev)
{
	struct mlxsw_sp_ipip_entry *tunnel;

	tunnel = mlxsw_sp_ipip_entry_find_by_ol_dev(mlxsw_sp, ol_dev);
	if (!tunnel)
		return;

	mlxsw_sp_ipip_entry_ol_up_event(mlxsw_sp, tunnel);
}
|
|
|
|
|
2017-11-03 17:03:33 +08:00
|
|
|
static void
|
|
|
|
mlxsw_sp_ipip_entry_ol_down_event(struct mlxsw_sp *mlxsw_sp,
|
|
|
|
struct mlxsw_sp_ipip_entry *ipip_entry)
|
|
|
|
{
|
|
|
|
if (ipip_entry->decap_fib_entry)
|
|
|
|
mlxsw_sp_ipip_entry_demote_decap(mlxsw_sp, ipip_entry);
|
|
|
|
}
|
|
|
|
|
2017-11-03 17:03:29 +08:00
|
|
|
/* Handle the overlay device @ol_dev going down: forward the event to its
 * IPIP entry, if it has one.
 */
static void mlxsw_sp_netdevice_ipip_ol_down_event(struct mlxsw_sp *mlxsw_sp,
						  struct net_device *ol_dev)
{
	struct mlxsw_sp_ipip_entry *tunnel;

	tunnel = mlxsw_sp_ipip_entry_find_by_ol_dev(mlxsw_sp, ol_dev);
	if (!tunnel)
		return;

	mlxsw_sp_ipip_entry_ol_down_event(mlxsw_sp, tunnel);
}
|
|
|
|
|
2017-11-28 20:17:14 +08:00
|
|
|
static void mlxsw_sp_nexthop_rif_migrate(struct mlxsw_sp *mlxsw_sp,
|
|
|
|
struct mlxsw_sp_rif *old_rif,
|
|
|
|
struct mlxsw_sp_rif *new_rif);
|
2017-11-03 17:03:37 +08:00
|
|
|
static int
|
|
|
|
mlxsw_sp_ipip_entry_ol_lb_update(struct mlxsw_sp *mlxsw_sp,
|
|
|
|
struct mlxsw_sp_ipip_entry *ipip_entry,
|
2017-11-03 17:03:38 +08:00
|
|
|
bool keep_encap,
|
2017-11-03 17:03:37 +08:00
|
|
|
struct netlink_ext_ack *extack)
|
|
|
|
{
|
|
|
|
struct mlxsw_sp_rif_ipip_lb *old_lb_rif = ipip_entry->ol_lb;
|
|
|
|
struct mlxsw_sp_rif_ipip_lb *new_lb_rif;
|
|
|
|
|
|
|
|
new_lb_rif = mlxsw_sp_ipip_ol_ipip_lb_create(mlxsw_sp,
|
|
|
|
ipip_entry->ipipt,
|
|
|
|
ipip_entry->ol_dev,
|
|
|
|
extack);
|
|
|
|
if (IS_ERR(new_lb_rif))
|
|
|
|
return PTR_ERR(new_lb_rif);
|
|
|
|
ipip_entry->ol_lb = new_lb_rif;
|
2017-11-03 17:03:38 +08:00
|
|
|
|
2017-11-28 20:17:14 +08:00
|
|
|
if (keep_encap)
|
|
|
|
mlxsw_sp_nexthop_rif_migrate(mlxsw_sp, &old_lb_rif->common,
|
|
|
|
&new_lb_rif->common);
|
2017-11-03 17:03:38 +08:00
|
|
|
|
2017-11-03 17:03:37 +08:00
|
|
|
mlxsw_sp_rif_destroy(&old_lb_rif->common);
|
2017-10-16 22:26:38 +08:00
|
|
|
|
2017-11-03 17:03:37 +08:00
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
2017-11-28 20:17:14 +08:00
|
|
|
static void mlxsw_sp_nexthop_rif_update(struct mlxsw_sp *mlxsw_sp,
|
|
|
|
struct mlxsw_sp_rif *rif);
|
|
|
|
|
2017-11-03 17:03:38 +08:00
|
|
|
/**
|
|
|
|
* Update the offload related to an IPIP entry. This always updates decap, and
|
|
|
|
* in addition to that it also:
|
|
|
|
* @recreate_loopback: recreates the associated loopback RIF
|
|
|
|
* @keep_encap: updates next hops that use the tunnel netdevice. This is only
|
|
|
|
* relevant when recreate_loopback is true.
|
|
|
|
* @update_nexthops: updates next hops, keeping the current loopback RIF. This
|
|
|
|
* is only relevant when recreate_loopback is false.
|
|
|
|
*/
|
2017-11-03 17:03:37 +08:00
|
|
|
int __mlxsw_sp_ipip_entry_update_tunnel(struct mlxsw_sp *mlxsw_sp,
|
|
|
|
struct mlxsw_sp_ipip_entry *ipip_entry,
|
2017-11-03 17:03:38 +08:00
|
|
|
bool recreate_loopback,
|
|
|
|
bool keep_encap,
|
|
|
|
bool update_nexthops,
|
2017-11-03 17:03:37 +08:00
|
|
|
struct netlink_ext_ack *extack)
|
|
|
|
{
|
|
|
|
int err;
|
2017-10-16 22:26:38 +08:00
|
|
|
|
2017-11-03 17:03:37 +08:00
|
|
|
/* RIFs can't be edited, so to update loopback, we need to destroy and
|
|
|
|
* recreate it. That creates a window of opportunity where RALUE and
|
|
|
|
* RATR registers end up referencing a RIF that's already gone. RATRs
|
|
|
|
* are handled in mlxsw_sp_ipip_entry_ol_lb_update(), and to take care
|
2017-10-16 22:26:38 +08:00
|
|
|
* of RALUE, demote the decap route back.
|
|
|
|
*/
|
|
|
|
if (ipip_entry->decap_fib_entry)
|
|
|
|
mlxsw_sp_ipip_entry_demote_decap(mlxsw_sp, ipip_entry);
|
|
|
|
|
2017-11-03 17:03:38 +08:00
|
|
|
if (recreate_loopback) {
|
|
|
|
err = mlxsw_sp_ipip_entry_ol_lb_update(mlxsw_sp, ipip_entry,
|
|
|
|
keep_encap, extack);
|
|
|
|
if (err)
|
|
|
|
return err;
|
|
|
|
} else if (update_nexthops) {
|
|
|
|
mlxsw_sp_nexthop_rif_update(mlxsw_sp,
|
|
|
|
&ipip_entry->ol_lb->common);
|
|
|
|
}
|
2017-11-03 17:03:37 +08:00
|
|
|
|
|
|
|
if (ipip_entry->ol_dev->flags & IFF_UP)
|
|
|
|
mlxsw_sp_ipip_entry_ol_up_event(mlxsw_sp, ipip_entry);
|
2017-10-16 22:26:38 +08:00
|
|
|
|
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
2017-11-03 17:03:37 +08:00
|
|
|
static int mlxsw_sp_netdevice_ipip_ol_vrf_event(struct mlxsw_sp *mlxsw_sp,
|
|
|
|
struct net_device *ol_dev,
|
|
|
|
struct netlink_ext_ack *extack)
|
|
|
|
{
|
|
|
|
struct mlxsw_sp_ipip_entry *ipip_entry =
|
|
|
|
mlxsw_sp_ipip_entry_find_by_ol_dev(mlxsw_sp, ol_dev);
|
|
|
|
|
|
|
|
if (!ipip_entry)
|
|
|
|
return 0;
|
2017-11-28 20:17:12 +08:00
|
|
|
|
2017-11-03 17:03:37 +08:00
|
|
|
return __mlxsw_sp_ipip_entry_update_tunnel(mlxsw_sp, ipip_entry,
|
2017-11-03 17:03:38 +08:00
|
|
|
true, false, false, extack);
|
2017-11-03 17:03:37 +08:00
|
|
|
}
|
|
|
|
|
2017-11-03 17:03:41 +08:00
|
|
|
static int
|
|
|
|
mlxsw_sp_netdevice_ipip_ul_vrf_event(struct mlxsw_sp *mlxsw_sp,
|
|
|
|
struct mlxsw_sp_ipip_entry *ipip_entry,
|
|
|
|
struct net_device *ul_dev,
|
2019-11-24 15:48:02 +08:00
|
|
|
bool *demote_this,
|
2017-11-03 17:03:41 +08:00
|
|
|
struct netlink_ext_ack *extack)
|
|
|
|
{
|
2019-11-24 15:48:02 +08:00
|
|
|
u32 ul_tb_id = l3mdev_fib_table(ul_dev) ? : RT_TABLE_MAIN;
|
|
|
|
enum mlxsw_sp_l3proto ul_proto;
|
|
|
|
union mlxsw_sp_l3addr saddr;
|
|
|
|
|
|
|
|
/* Moving underlay to a different VRF might cause local address
|
|
|
|
* conflict, and the conflicting tunnels need to be demoted.
|
|
|
|
*/
|
|
|
|
ul_proto = mlxsw_sp->router->ipip_ops_arr[ipip_entry->ipipt]->ul_proto;
|
|
|
|
saddr = mlxsw_sp_ipip_netdev_saddr(ul_proto, ipip_entry->ol_dev);
|
|
|
|
if (mlxsw_sp_ipip_demote_tunnel_by_saddr(mlxsw_sp, ul_proto,
|
|
|
|
saddr, ul_tb_id,
|
|
|
|
ipip_entry)) {
|
|
|
|
*demote_this = true;
|
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
2017-11-03 17:03:41 +08:00
|
|
|
return __mlxsw_sp_ipip_entry_update_tunnel(mlxsw_sp, ipip_entry,
|
|
|
|
true, true, false, extack);
|
|
|
|
}
|
|
|
|
|
2017-11-03 17:03:44 +08:00
|
|
|
static int
|
|
|
|
mlxsw_sp_netdevice_ipip_ul_up_event(struct mlxsw_sp *mlxsw_sp,
|
|
|
|
struct mlxsw_sp_ipip_entry *ipip_entry,
|
|
|
|
struct net_device *ul_dev)
|
|
|
|
{
|
|
|
|
return __mlxsw_sp_ipip_entry_update_tunnel(mlxsw_sp, ipip_entry,
|
|
|
|
false, false, true, NULL);
|
|
|
|
}
|
|
|
|
|
|
|
|
static int
|
|
|
|
mlxsw_sp_netdevice_ipip_ul_down_event(struct mlxsw_sp *mlxsw_sp,
|
|
|
|
struct mlxsw_sp_ipip_entry *ipip_entry,
|
|
|
|
struct net_device *ul_dev)
|
|
|
|
{
|
|
|
|
/* A down underlay device causes encapsulated packets to not be
|
|
|
|
* forwarded, but decap still works. So refresh next hops without
|
|
|
|
* touching anything else.
|
|
|
|
*/
|
|
|
|
return __mlxsw_sp_ipip_entry_update_tunnel(mlxsw_sp, ipip_entry,
|
|
|
|
false, false, true, NULL);
|
|
|
|
}
|
|
|
|
|
2017-11-03 17:03:42 +08:00
|
|
|
static int
|
|
|
|
mlxsw_sp_netdevice_ipip_ol_change_event(struct mlxsw_sp *mlxsw_sp,
|
|
|
|
struct net_device *ol_dev,
|
|
|
|
struct netlink_ext_ack *extack)
|
|
|
|
{
|
|
|
|
const struct mlxsw_sp_ipip_ops *ipip_ops;
|
|
|
|
struct mlxsw_sp_ipip_entry *ipip_entry;
|
|
|
|
int err;
|
|
|
|
|
|
|
|
ipip_entry = mlxsw_sp_ipip_entry_find_by_ol_dev(mlxsw_sp, ol_dev);
|
|
|
|
if (!ipip_entry)
|
|
|
|
/* A change might make a tunnel eligible for offloading, but
|
|
|
|
* that is currently not implemented. What falls to slow path
|
|
|
|
* stays there.
|
|
|
|
*/
|
|
|
|
return 0;
|
|
|
|
|
|
|
|
/* A change might make a tunnel not eligible for offloading. */
|
|
|
|
if (!mlxsw_sp_netdevice_ipip_can_offload(mlxsw_sp, ol_dev,
|
|
|
|
ipip_entry->ipipt)) {
|
|
|
|
mlxsw_sp_ipip_entry_demote_tunnel(mlxsw_sp, ipip_entry);
|
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
|
|
|
ipip_ops = mlxsw_sp->router->ipip_ops_arr[ipip_entry->ipipt];
|
|
|
|
err = ipip_ops->ol_netdev_change(mlxsw_sp, ipip_entry, extack);
|
|
|
|
return err;
|
|
|
|
}
|
|
|
|
|
mlxsw: spectrum_router: Onload conflicting tunnels
The approach for offloading IP tunnels implemented currently by mlxsw
doesn't allow two tunnels that have the same local IP address in the
same (underlay) VRF. Previously, offloads were introduced on demand as
encap routes were formed. When such a route was created that would cause
offload of a conflicting tunnel, mlxsw_sp_ipip_entry_create() would
detect it and return -EEXIST, which would propagate up and cause FIB
abort.
Now however IPIP entries are created as soon as an offloadable netdevice
is created, and the failure prevents creation of such device.
Furthermore, if the driver is installed at the point where such
conflicting tunnels exist, the failure actually prevents successful
modprobe.
Furthermore, follow-up patches implement handling of NETDEV_CHANGE due
to the local address change. However, NETDEV_CHANGE can't be vetoed. The
failure merely means that the offloads weren't updated, but the change
in Linux configuration is not rolled back. It is thus desirable to have
a robust way of handling these conflicts, which can later be reused for
handling NETDEV_CHANGE as well.
To fix this, when a conflicting tunnel is created, instead of failing,
simply pull the old tunnel to slow path and reject offloading the
new one.
Introduce two functions: mlxsw_sp_ipip_entry_demote_tunnel() and
mlxsw_sp_ipip_demote_tunnel_by_saddr() to handle this. Make them both
public, because they will be useful later on in this patchset.
Signed-off-by: Petr Machata <petrm@mellanox.com>
Reviewed-by: Ido Schimmel <idosch@mellanox.com>
Signed-off-by: Jiri Pirko <jiri@mellanox.com>
Signed-off-by: David S. Miller <davem@davemloft.net>
2017-11-03 17:03:40 +08:00
|
|
|
void mlxsw_sp_ipip_entry_demote_tunnel(struct mlxsw_sp *mlxsw_sp,
|
|
|
|
struct mlxsw_sp_ipip_entry *ipip_entry)
|
|
|
|
{
|
|
|
|
struct net_device *ol_dev = ipip_entry->ol_dev;
|
|
|
|
|
|
|
|
if (ol_dev->flags & IFF_UP)
|
|
|
|
mlxsw_sp_ipip_entry_ol_down_event(mlxsw_sp, ipip_entry);
|
|
|
|
mlxsw_sp_ipip_entry_destroy(mlxsw_sp, ipip_entry);
|
|
|
|
}
|
|
|
|
|
|
|
|
/* The configuration where several tunnels have the same local address in the
|
|
|
|
* same underlay table needs special treatment in the HW. That is currently not
|
|
|
|
* implemented in the driver. This function finds and demotes the first tunnel
|
|
|
|
* with a given source address, except the one passed in in the argument
|
|
|
|
* `except'.
|
|
|
|
*/
|
|
|
|
bool
|
|
|
|
mlxsw_sp_ipip_demote_tunnel_by_saddr(struct mlxsw_sp *mlxsw_sp,
|
|
|
|
enum mlxsw_sp_l3proto ul_proto,
|
|
|
|
union mlxsw_sp_l3addr saddr,
|
|
|
|
u32 ul_tb_id,
|
|
|
|
const struct mlxsw_sp_ipip_entry *except)
|
|
|
|
{
|
|
|
|
struct mlxsw_sp_ipip_entry *ipip_entry, *tmp;
|
|
|
|
|
|
|
|
list_for_each_entry_safe(ipip_entry, tmp, &mlxsw_sp->router->ipip_list,
|
|
|
|
ipip_list_node) {
|
|
|
|
if (ipip_entry != except &&
|
|
|
|
mlxsw_sp_ipip_entry_saddr_matches(mlxsw_sp, ul_proto, saddr,
|
|
|
|
ul_tb_id, ipip_entry)) {
|
|
|
|
mlxsw_sp_ipip_entry_demote_tunnel(mlxsw_sp, ipip_entry);
|
|
|
|
return true;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
return false;
|
|
|
|
}
|
|
|
|
|
2017-11-03 17:03:41 +08:00
|
|
|
static void mlxsw_sp_ipip_demote_tunnel_by_ul_netdev(struct mlxsw_sp *mlxsw_sp,
|
|
|
|
struct net_device *ul_dev)
|
|
|
|
{
|
|
|
|
struct mlxsw_sp_ipip_entry *ipip_entry, *tmp;
|
|
|
|
|
|
|
|
list_for_each_entry_safe(ipip_entry, tmp, &mlxsw_sp->router->ipip_list,
|
|
|
|
ipip_list_node) {
|
2020-02-20 15:07:55 +08:00
|
|
|
struct net_device *ol_dev = ipip_entry->ol_dev;
|
|
|
|
struct net_device *ipip_ul_dev;
|
2017-11-03 17:03:41 +08:00
|
|
|
|
2020-02-20 15:07:55 +08:00
|
|
|
rcu_read_lock();
|
|
|
|
ipip_ul_dev = __mlxsw_sp_ipip_netdev_ul_dev_get(ol_dev);
|
|
|
|
rcu_read_unlock();
|
2017-11-03 17:03:41 +08:00
|
|
|
if (ipip_ul_dev == ul_dev)
|
|
|
|
mlxsw_sp_ipip_entry_demote_tunnel(mlxsw_sp, ipip_entry);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2017-11-03 17:03:36 +08:00
|
|
|
int mlxsw_sp_netdevice_ipip_ol_event(struct mlxsw_sp *mlxsw_sp,
|
|
|
|
struct net_device *ol_dev,
|
|
|
|
unsigned long event,
|
|
|
|
struct netdev_notifier_info *info)
|
2017-10-16 22:26:37 +08:00
|
|
|
{
|
2017-11-03 17:03:36 +08:00
|
|
|
struct netdev_notifier_changeupper_info *chup;
|
|
|
|
struct netlink_ext_ack *extack;
|
2020-02-22 01:54:12 +08:00
|
|
|
int err = 0;
|
2017-11-03 17:03:36 +08:00
|
|
|
|
2020-02-22 01:54:12 +08:00
|
|
|
mutex_lock(&mlxsw_sp->router->lock);
|
2017-10-16 22:26:37 +08:00
|
|
|
switch (event) {
|
|
|
|
case NETDEV_REGISTER:
|
2020-02-22 01:54:12 +08:00
|
|
|
err = mlxsw_sp_netdevice_ipip_ol_reg_event(mlxsw_sp, ol_dev);
|
|
|
|
break;
|
2017-10-16 22:26:37 +08:00
|
|
|
case NETDEV_UNREGISTER:
|
2017-11-03 17:03:29 +08:00
|
|
|
mlxsw_sp_netdevice_ipip_ol_unreg_event(mlxsw_sp, ol_dev);
|
2020-02-22 01:54:12 +08:00
|
|
|
break;
|
2017-10-16 22:26:37 +08:00
|
|
|
case NETDEV_UP:
|
2017-11-03 17:03:34 +08:00
|
|
|
mlxsw_sp_netdevice_ipip_ol_up_event(mlxsw_sp, ol_dev);
|
2020-02-22 01:54:12 +08:00
|
|
|
break;
|
2017-10-16 22:26:37 +08:00
|
|
|
case NETDEV_DOWN:
|
2017-11-03 17:03:29 +08:00
|
|
|
mlxsw_sp_netdevice_ipip_ol_down_event(mlxsw_sp, ol_dev);
|
2020-02-22 01:54:12 +08:00
|
|
|
break;
|
2017-10-16 22:26:38 +08:00
|
|
|
case NETDEV_CHANGEUPPER:
|
2017-11-03 17:03:36 +08:00
|
|
|
chup = container_of(info, typeof(*chup), info);
|
|
|
|
extack = info->extack;
|
|
|
|
if (netif_is_l3_master(chup->upper_dev))
|
2020-02-22 01:54:12 +08:00
|
|
|
err = mlxsw_sp_netdevice_ipip_ol_vrf_event(mlxsw_sp,
|
|
|
|
ol_dev,
|
|
|
|
extack);
|
|
|
|
break;
|
2017-11-03 17:03:42 +08:00
|
|
|
case NETDEV_CHANGE:
|
|
|
|
extack = info->extack;
|
2020-02-22 01:54:12 +08:00
|
|
|
err = mlxsw_sp_netdevice_ipip_ol_change_event(mlxsw_sp,
|
|
|
|
ol_dev, extack);
|
|
|
|
break;
|
2018-03-23 01:53:35 +08:00
|
|
|
case NETDEV_CHANGEMTU:
|
2020-02-22 01:54:12 +08:00
|
|
|
err = mlxsw_sp_netdevice_ipip_ol_update_mtu(mlxsw_sp, ol_dev);
|
|
|
|
break;
|
2017-10-16 22:26:37 +08:00
|
|
|
}
|
2020-02-22 01:54:12 +08:00
|
|
|
mutex_unlock(&mlxsw_sp->router->lock);
|
|
|
|
return err;
|
2017-10-16 22:26:37 +08:00
|
|
|
}
|
|
|
|
|
2017-11-03 17:03:41 +08:00
|
|
|
static int
|
|
|
|
__mlxsw_sp_netdevice_ipip_ul_event(struct mlxsw_sp *mlxsw_sp,
|
|
|
|
struct mlxsw_sp_ipip_entry *ipip_entry,
|
|
|
|
struct net_device *ul_dev,
|
2019-11-24 15:48:02 +08:00
|
|
|
bool *demote_this,
|
2017-11-03 17:03:41 +08:00
|
|
|
unsigned long event,
|
|
|
|
struct netdev_notifier_info *info)
|
|
|
|
{
|
|
|
|
struct netdev_notifier_changeupper_info *chup;
|
|
|
|
struct netlink_ext_ack *extack;
|
|
|
|
|
|
|
|
switch (event) {
|
|
|
|
case NETDEV_CHANGEUPPER:
|
|
|
|
chup = container_of(info, typeof(*chup), info);
|
|
|
|
extack = info->extack;
|
|
|
|
if (netif_is_l3_master(chup->upper_dev))
|
|
|
|
return mlxsw_sp_netdevice_ipip_ul_vrf_event(mlxsw_sp,
|
|
|
|
ipip_entry,
|
|
|
|
ul_dev,
|
2019-11-24 15:48:02 +08:00
|
|
|
demote_this,
|
2017-11-03 17:03:41 +08:00
|
|
|
extack);
|
|
|
|
break;
|
2017-11-03 17:03:44 +08:00
|
|
|
|
|
|
|
case NETDEV_UP:
|
|
|
|
return mlxsw_sp_netdevice_ipip_ul_up_event(mlxsw_sp, ipip_entry,
|
|
|
|
ul_dev);
|
|
|
|
case NETDEV_DOWN:
|
|
|
|
return mlxsw_sp_netdevice_ipip_ul_down_event(mlxsw_sp,
|
|
|
|
ipip_entry,
|
|
|
|
ul_dev);
|
2017-11-03 17:03:41 +08:00
|
|
|
}
|
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
|
|
|
int
|
|
|
|
mlxsw_sp_netdevice_ipip_ul_event(struct mlxsw_sp *mlxsw_sp,
|
|
|
|
struct net_device *ul_dev,
|
|
|
|
unsigned long event,
|
|
|
|
struct netdev_notifier_info *info)
|
|
|
|
{
|
|
|
|
struct mlxsw_sp_ipip_entry *ipip_entry = NULL;
|
2020-02-22 01:54:12 +08:00
|
|
|
int err = 0;
|
2017-11-03 17:03:41 +08:00
|
|
|
|
2020-02-22 01:54:12 +08:00
|
|
|
mutex_lock(&mlxsw_sp->router->lock);
|
2017-11-03 17:03:41 +08:00
|
|
|
while ((ipip_entry = mlxsw_sp_ipip_entry_find_by_ul_dev(mlxsw_sp,
|
|
|
|
ul_dev,
|
|
|
|
ipip_entry))) {
|
2019-11-24 15:48:02 +08:00
|
|
|
struct mlxsw_sp_ipip_entry *prev;
|
|
|
|
bool demote_this = false;
|
|
|
|
|
2017-11-03 17:03:41 +08:00
|
|
|
err = __mlxsw_sp_netdevice_ipip_ul_event(mlxsw_sp, ipip_entry,
|
2019-11-24 15:48:02 +08:00
|
|
|
ul_dev, &demote_this,
|
|
|
|
event, info);
|
2017-11-03 17:03:41 +08:00
|
|
|
if (err) {
|
|
|
|
mlxsw_sp_ipip_demote_tunnel_by_ul_netdev(mlxsw_sp,
|
|
|
|
ul_dev);
|
2020-02-22 01:54:12 +08:00
|
|
|
break;
|
2017-11-03 17:03:41 +08:00
|
|
|
}
|
2019-11-24 15:48:02 +08:00
|
|
|
|
|
|
|
if (demote_this) {
|
|
|
|
if (list_is_first(&ipip_entry->ipip_list_node,
|
|
|
|
&mlxsw_sp->router->ipip_list))
|
|
|
|
prev = NULL;
|
|
|
|
else
|
|
|
|
/* This can't be cached from previous iteration,
|
|
|
|
* because that entry could be gone now.
|
|
|
|
*/
|
|
|
|
prev = list_prev_entry(ipip_entry,
|
|
|
|
ipip_list_node);
|
|
|
|
mlxsw_sp_ipip_entry_demote_tunnel(mlxsw_sp, ipip_entry);
|
|
|
|
ipip_entry = prev;
|
|
|
|
}
|
2017-11-03 17:03:41 +08:00
|
|
|
}
|
2020-02-22 01:54:12 +08:00
|
|
|
mutex_unlock(&mlxsw_sp->router->lock);
|
2017-11-03 17:03:41 +08:00
|
|
|
|
2020-02-22 01:54:12 +08:00
|
|
|
return err;
|
2017-11-03 17:03:41 +08:00
|
|
|
}
|
|
|
|
|
2018-10-17 16:53:07 +08:00
|
|
|
/* Record the NVE decap configuration in the router and, if a matching local
 * (IP2ME) route already exists as a trap entry, promote it to an NVE decap
 * entry using tunnel_index.
 *
 * Returns 0 on success, including when no matching local route exists yet.
 * Returns -EINVAL if a decap configuration is already recorded, or the error
 * from mlxsw_sp_fib_entry_update(). On failure the FIB entry is reverted to a
 * trap entry and the recorded configuration is invalidated again, so that a
 * later promotion attempt is not rejected because of a stale configuration.
 */
int mlxsw_sp_router_nve_promote_decap(struct mlxsw_sp *mlxsw_sp, u32 ul_tb_id,
				      enum mlxsw_sp_l3proto ul_proto,
				      const union mlxsw_sp_l3addr *ul_sip,
				      u32 tunnel_index)
{
	enum mlxsw_sp_fib_entry_type type = MLXSW_SP_FIB_ENTRY_TYPE_TRAP;
	struct mlxsw_sp_router *router = mlxsw_sp->router;
	struct mlxsw_sp_fib_entry *fib_entry;
	int err;

	if (WARN_ON_ONCE(router->nve_decap_config.valid))
		return -EINVAL;

	router->nve_decap_config.ul_tb_id = ul_tb_id;
	router->nve_decap_config.tunnel_index = tunnel_index;
	router->nve_decap_config.ul_proto = ul_proto;
	router->nve_decap_config.ul_sip = *ul_sip;
	router->nve_decap_config.valid = true;

	/* It is valid to create a tunnel with a local IP and only later
	 * assign this IP address to a local interface
	 */
	fib_entry = mlxsw_sp_router_ip2me_fib_entry_find(mlxsw_sp, ul_tb_id,
							 ul_proto, ul_sip,
							 type);
	if (!fib_entry)
		return 0;

	fib_entry->decap.tunnel_index = tunnel_index;
	fib_entry->type = MLXSW_SP_FIB_ENTRY_TYPE_NVE_DECAP;

	err = mlxsw_sp_fib_entry_update(mlxsw_sp, fib_entry);
	if (err)
		goto err_fib_entry_update;

	return 0;

err_fib_entry_update:
	fib_entry->type = MLXSW_SP_FIB_ENTRY_TYPE_TRAP;
	mlxsw_sp_fib_entry_update(mlxsw_sp, fib_entry);
	/* The promotion did not take effect, so do not keep advertising the
	 * decap configuration as valid.
	 */
	router->nve_decap_config.valid = false;
	return err;
}
|
|
|
|
|
|
|
|
/* Invalidate the recorded NVE decap configuration and, if a matching local
 * (IP2ME) route is currently an NVE decap entry, turn it back into a trap
 * entry. Warns once and does nothing if no configuration is recorded.
 */
void mlxsw_sp_router_nve_demote_decap(struct mlxsw_sp *mlxsw_sp, u32 ul_tb_id,
				      enum mlxsw_sp_l3proto ul_proto,
				      const union mlxsw_sp_l3addr *ul_sip)
{
	struct mlxsw_sp_router *router = mlxsw_sp->router;
	struct mlxsw_sp_fib_entry *fib_entry;

	if (WARN_ON_ONCE(!router->nve_decap_config.valid))
		return;
	router->nve_decap_config.valid = false;

	fib_entry = mlxsw_sp_router_ip2me_fib_entry_find(mlxsw_sp, ul_tb_id,
							 ul_proto, ul_sip,
							 MLXSW_SP_FIB_ENTRY_TYPE_NVE_DECAP);
	if (fib_entry) {
		fib_entry->type = MLXSW_SP_FIB_ENTRY_TYPE_TRAP;
		/* The result of the update is not checked here. */
		mlxsw_sp_fib_entry_update(mlxsw_sp, fib_entry);
	}
}
|
|
|
|
|
2020-02-22 01:54:08 +08:00
|
|
|
static bool mlxsw_sp_router_nve_is_decap(struct mlxsw_sp *mlxsw_sp,
|
|
|
|
u32 ul_tb_id,
|
|
|
|
enum mlxsw_sp_l3proto ul_proto,
|
|
|
|
const union mlxsw_sp_l3addr *ul_sip)
|
|
|
|
{
|
|
|
|
struct mlxsw_sp_router *router = mlxsw_sp->router;
|
|
|
|
|
|
|
|
return router->nve_decap_config.valid &&
|
|
|
|
router->nve_decap_config.ul_tb_id == ul_tb_id &&
|
|
|
|
router->nve_decap_config.ul_proto == ul_proto &&
|
|
|
|
!memcmp(&router->nve_decap_config.ul_sip, ul_sip,
|
|
|
|
sizeof(*ul_sip));
|
|
|
|
}
|
|
|
|
|
2016-07-05 17:27:39 +08:00
|
|
|
/* Hash table key of a neighbour entry: the kernel neighbour pointer itself. */
struct mlxsw_sp_neigh_key {
	struct neighbour *n;
};
|
|
|
|
|
|
|
|
struct mlxsw_sp_neigh_entry {
|
2017-02-08 18:16:42 +08:00
|
|
|
struct list_head rif_list_node;
|
2016-07-05 17:27:39 +08:00
|
|
|
struct rhash_head ht_node;
|
|
|
|
struct mlxsw_sp_neigh_key key;
|
|
|
|
u16 rif;
|
2017-02-06 23:20:13 +08:00
|
|
|
bool connected;
|
2016-07-05 17:27:44 +08:00
|
|
|
unsigned char ha[ETH_ALEN];
|
2016-07-05 17:27:50 +08:00
|
|
|
struct list_head nexthop_list; /* list of nexthops using
|
|
|
|
* this neigh entry
|
|
|
|
*/
|
2016-07-05 17:27:51 +08:00
|
|
|
struct list_head nexthop_neighs_list_node;
|
2017-08-24 14:40:08 +08:00
|
|
|
unsigned int counter_index;
|
|
|
|
bool counter_valid;
|
2016-07-05 17:27:39 +08:00
|
|
|
};
|
|
|
|
|
|
|
|
static const struct rhashtable_params mlxsw_sp_neigh_ht_params = {
|
|
|
|
.key_offset = offsetof(struct mlxsw_sp_neigh_entry, key),
|
|
|
|
.head_offset = offsetof(struct mlxsw_sp_neigh_entry, ht_node),
|
|
|
|
.key_len = sizeof(struct mlxsw_sp_neigh_key),
|
|
|
|
};
|
|
|
|
|
2017-08-24 14:40:04 +08:00
|
|
|
struct mlxsw_sp_neigh_entry *
|
|
|
|
mlxsw_sp_rif_neigh_next(struct mlxsw_sp_rif *rif,
|
|
|
|
struct mlxsw_sp_neigh_entry *neigh_entry)
|
|
|
|
{
|
|
|
|
if (!neigh_entry) {
|
|
|
|
if (list_empty(&rif->neigh_list))
|
|
|
|
return NULL;
|
|
|
|
else
|
|
|
|
return list_first_entry(&rif->neigh_list,
|
|
|
|
typeof(*neigh_entry),
|
|
|
|
rif_list_node);
|
|
|
|
}
|
2017-09-25 16:32:24 +08:00
|
|
|
if (list_is_last(&neigh_entry->rif_list_node, &rif->neigh_list))
|
2017-08-24 14:40:04 +08:00
|
|
|
return NULL;
|
|
|
|
return list_next_entry(neigh_entry, rif_list_node);
|
|
|
|
}
|
|
|
|
|
|
|
|
int mlxsw_sp_neigh_entry_type(struct mlxsw_sp_neigh_entry *neigh_entry)
|
|
|
|
{
|
|
|
|
return neigh_entry->key.n->tbl->family;
|
|
|
|
}
|
|
|
|
|
|
|
|
unsigned char *
|
|
|
|
mlxsw_sp_neigh_entry_ha(struct mlxsw_sp_neigh_entry *neigh_entry)
|
|
|
|
{
|
|
|
|
return neigh_entry->ha;
|
|
|
|
}
|
|
|
|
|
|
|
|
u32 mlxsw_sp_neigh4_entry_dip(struct mlxsw_sp_neigh_entry *neigh_entry)
|
|
|
|
{
|
|
|
|
struct neighbour *n;
|
|
|
|
|
|
|
|
n = neigh_entry->key.n;
|
|
|
|
return ntohl(*((__be32 *) n->primary_key));
|
|
|
|
}
|
|
|
|
|
2017-08-31 23:59:15 +08:00
|
|
|
struct in6_addr *
|
|
|
|
mlxsw_sp_neigh6_entry_dip(struct mlxsw_sp_neigh_entry *neigh_entry)
|
|
|
|
{
|
|
|
|
struct neighbour *n;
|
|
|
|
|
|
|
|
n = neigh_entry->key.n;
|
|
|
|
return (struct in6_addr *) &n->primary_key;
|
|
|
|
}
|
|
|
|
|
2017-08-24 14:40:08 +08:00
|
|
|
int mlxsw_sp_neigh_counter_get(struct mlxsw_sp *mlxsw_sp,
|
|
|
|
struct mlxsw_sp_neigh_entry *neigh_entry,
|
|
|
|
u64 *p_counter)
|
|
|
|
{
|
|
|
|
if (!neigh_entry->counter_valid)
|
|
|
|
return -EINVAL;
|
|
|
|
|
|
|
|
return mlxsw_sp_flow_counter_get(mlxsw_sp, neigh_entry->counter_index,
|
|
|
|
p_counter, NULL);
|
|
|
|
}
|
|
|
|
|
2016-07-05 17:27:39 +08:00
|
|
|
static struct mlxsw_sp_neigh_entry *
|
2017-02-06 23:20:13 +08:00
|
|
|
mlxsw_sp_neigh_entry_alloc(struct mlxsw_sp *mlxsw_sp, struct neighbour *n,
|
|
|
|
u16 rif)
|
2016-07-05 17:27:39 +08:00
|
|
|
{
|
|
|
|
struct mlxsw_sp_neigh_entry *neigh_entry;
|
|
|
|
|
2017-02-06 23:20:13 +08:00
|
|
|
neigh_entry = kzalloc(sizeof(*neigh_entry), GFP_KERNEL);
|
2016-07-05 17:27:39 +08:00
|
|
|
if (!neigh_entry)
|
|
|
|
return NULL;
|
2017-02-06 23:20:13 +08:00
|
|
|
|
2016-11-10 19:31:04 +08:00
|
|
|
neigh_entry->key.n = n;
|
2016-07-05 17:27:39 +08:00
|
|
|
neigh_entry->rif = rif;
|
2016-07-05 17:27:50 +08:00
|
|
|
INIT_LIST_HEAD(&neigh_entry->nexthop_list);
|
2017-02-06 23:20:13 +08:00
|
|
|
|
2016-07-05 17:27:39 +08:00
|
|
|
return neigh_entry;
|
|
|
|
}
|
|
|
|
|
2017-02-06 23:20:13 +08:00
|
|
|
/* Release the memory of a neighbour entry. */
static void mlxsw_sp_neigh_entry_free(struct mlxsw_sp_neigh_entry *neigh_entry)
{
	kfree(neigh_entry);
}
|
|
|
|
|
2017-02-06 23:20:13 +08:00
|
|
|
static int
|
|
|
|
mlxsw_sp_neigh_entry_insert(struct mlxsw_sp *mlxsw_sp,
|
|
|
|
struct mlxsw_sp_neigh_entry *neigh_entry)
|
2016-07-05 17:27:39 +08:00
|
|
|
{
|
2017-05-17 01:38:25 +08:00
|
|
|
return rhashtable_insert_fast(&mlxsw_sp->router->neigh_ht,
|
2017-02-06 23:20:13 +08:00
|
|
|
&neigh_entry->ht_node,
|
|
|
|
mlxsw_sp_neigh_ht_params);
|
|
|
|
}
|
2016-07-05 17:27:39 +08:00
|
|
|
|
2017-02-06 23:20:13 +08:00
|
|
|
static void
|
|
|
|
mlxsw_sp_neigh_entry_remove(struct mlxsw_sp *mlxsw_sp,
|
|
|
|
struct mlxsw_sp_neigh_entry *neigh_entry)
|
|
|
|
{
|
2017-05-17 01:38:25 +08:00
|
|
|
rhashtable_remove_fast(&mlxsw_sp->router->neigh_ht,
|
2017-02-06 23:20:13 +08:00
|
|
|
&neigh_entry->ht_node,
|
|
|
|
mlxsw_sp_neigh_ht_params);
|
2016-07-05 17:27:39 +08:00
|
|
|
}
|
|
|
|
|
2017-08-24 14:40:08 +08:00
|
|
|
static bool
|
2017-08-31 23:59:18 +08:00
|
|
|
mlxsw_sp_neigh_counter_should_alloc(struct mlxsw_sp *mlxsw_sp,
|
|
|
|
struct mlxsw_sp_neigh_entry *neigh_entry)
|
2017-08-24 14:40:08 +08:00
|
|
|
{
|
|
|
|
struct devlink *devlink;
|
2017-08-31 23:59:18 +08:00
|
|
|
const char *table_name;
|
|
|
|
|
|
|
|
switch (mlxsw_sp_neigh_entry_type(neigh_entry)) {
|
|
|
|
case AF_INET:
|
|
|
|
table_name = MLXSW_SP_DPIPE_TABLE_NAME_HOST4;
|
|
|
|
break;
|
|
|
|
case AF_INET6:
|
|
|
|
table_name = MLXSW_SP_DPIPE_TABLE_NAME_HOST6;
|
|
|
|
break;
|
|
|
|
default:
|
|
|
|
WARN_ON(1);
|
|
|
|
return false;
|
|
|
|
}
|
2017-08-24 14:40:08 +08:00
|
|
|
|
|
|
|
devlink = priv_to_devlink(mlxsw_sp->core);
|
2017-08-31 23:59:18 +08:00
|
|
|
return devlink_dpipe_table_counter_enabled(devlink, table_name);
|
2017-08-24 14:40:08 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
static void
|
|
|
|
mlxsw_sp_neigh_counter_alloc(struct mlxsw_sp *mlxsw_sp,
|
|
|
|
struct mlxsw_sp_neigh_entry *neigh_entry)
|
|
|
|
{
|
2017-08-31 23:59:18 +08:00
|
|
|
if (!mlxsw_sp_neigh_counter_should_alloc(mlxsw_sp, neigh_entry))
|
2017-08-24 14:40:08 +08:00
|
|
|
return;
|
|
|
|
|
|
|
|
if (mlxsw_sp_flow_counter_alloc(mlxsw_sp, &neigh_entry->counter_index))
|
|
|
|
return;
|
|
|
|
|
|
|
|
neigh_entry->counter_valid = true;
|
|
|
|
}
|
|
|
|
|
|
|
|
static void
|
|
|
|
mlxsw_sp_neigh_counter_free(struct mlxsw_sp *mlxsw_sp,
|
|
|
|
struct mlxsw_sp_neigh_entry *neigh_entry)
|
|
|
|
{
|
|
|
|
if (!neigh_entry->counter_valid)
|
|
|
|
return;
|
|
|
|
mlxsw_sp_flow_counter_free(mlxsw_sp,
|
|
|
|
neigh_entry->counter_index);
|
|
|
|
neigh_entry->counter_valid = false;
|
|
|
|
}
|
|
|
|
|
2017-02-06 23:20:13 +08:00
|
|
|
static struct mlxsw_sp_neigh_entry *
|
|
|
|
mlxsw_sp_neigh_entry_create(struct mlxsw_sp *mlxsw_sp, struct neighbour *n)
|
2016-07-05 17:27:39 +08:00
|
|
|
{
|
|
|
|
struct mlxsw_sp_neigh_entry *neigh_entry;
|
2017-03-17 16:38:00 +08:00
|
|
|
struct mlxsw_sp_rif *rif;
|
2016-07-05 17:27:39 +08:00
|
|
|
int err;
|
|
|
|
|
2017-03-17 16:38:00 +08:00
|
|
|
rif = mlxsw_sp_rif_find_by_dev(mlxsw_sp, n->dev);
|
|
|
|
if (!rif)
|
2017-02-06 23:20:13 +08:00
|
|
|
return ERR_PTR(-EINVAL);
|
2016-07-05 17:27:39 +08:00
|
|
|
|
2017-03-17 16:38:00 +08:00
|
|
|
neigh_entry = mlxsw_sp_neigh_entry_alloc(mlxsw_sp, n, rif->rif_index);
|
2016-07-05 17:27:39 +08:00
|
|
|
if (!neigh_entry)
|
2017-02-06 23:20:13 +08:00
|
|
|
return ERR_PTR(-ENOMEM);
|
|
|
|
|
2016-07-05 17:27:39 +08:00
|
|
|
err = mlxsw_sp_neigh_entry_insert(mlxsw_sp, neigh_entry);
|
|
|
|
if (err)
|
|
|
|
goto err_neigh_entry_insert;
|
2017-02-06 23:20:13 +08:00
|
|
|
|
2017-08-24 14:40:08 +08:00
|
|
|
mlxsw_sp_neigh_counter_alloc(mlxsw_sp, neigh_entry);
|
2017-03-17 16:38:00 +08:00
|
|
|
list_add(&neigh_entry->rif_list_node, &rif->neigh_list);
|
2017-02-08 18:16:42 +08:00
|
|
|
|
2017-02-06 23:20:13 +08:00
|
|
|
return neigh_entry;
|
2016-07-05 17:27:39 +08:00
|
|
|
|
|
|
|
err_neigh_entry_insert:
|
2017-02-06 23:20:13 +08:00
|
|
|
mlxsw_sp_neigh_entry_free(neigh_entry);
|
|
|
|
return ERR_PTR(err);
|
2016-07-05 17:27:39 +08:00
|
|
|
}
|
|
|
|
|
2017-02-06 23:20:13 +08:00
|
|
|
static void
|
|
|
|
mlxsw_sp_neigh_entry_destroy(struct mlxsw_sp *mlxsw_sp,
|
|
|
|
struct mlxsw_sp_neigh_entry *neigh_entry)
|
2016-07-05 17:27:39 +08:00
|
|
|
{
|
2017-02-08 18:16:42 +08:00
|
|
|
list_del(&neigh_entry->rif_list_node);
|
2017-08-24 14:40:08 +08:00
|
|
|
mlxsw_sp_neigh_counter_free(mlxsw_sp, neigh_entry);
|
2017-02-06 23:20:13 +08:00
|
|
|
mlxsw_sp_neigh_entry_remove(mlxsw_sp, neigh_entry);
|
|
|
|
mlxsw_sp_neigh_entry_free(neigh_entry);
|
|
|
|
}
|
2016-07-05 17:27:39 +08:00
|
|
|
|
2017-02-06 23:20:13 +08:00
|
|
|
static struct mlxsw_sp_neigh_entry *
|
|
|
|
mlxsw_sp_neigh_entry_lookup(struct mlxsw_sp *mlxsw_sp, struct neighbour *n)
|
|
|
|
{
|
|
|
|
struct mlxsw_sp_neigh_key key;
|
2016-07-05 17:27:39 +08:00
|
|
|
|
2017-02-06 23:20:13 +08:00
|
|
|
key.n = n;
|
2017-05-17 01:38:25 +08:00
|
|
|
return rhashtable_lookup_fast(&mlxsw_sp->router->neigh_ht,
|
2017-02-06 23:20:13 +08:00
|
|
|
&key, mlxsw_sp_neigh_ht_params);
|
2016-07-05 17:27:39 +08:00
|
|
|
}
|
|
|
|
|
2016-07-05 17:27:43 +08:00
|
|
|
static void
|
|
|
|
mlxsw_sp_router_neighs_update_interval_init(struct mlxsw_sp *mlxsw_sp)
|
|
|
|
{
|
2017-07-18 16:10:18 +08:00
|
|
|
unsigned long interval;
|
2016-07-05 17:27:43 +08:00
|
|
|
|
2017-07-24 15:56:00 +08:00
|
|
|
#if IS_ENABLED(CONFIG_IPV6)
|
2017-07-18 16:10:18 +08:00
|
|
|
interval = min_t(unsigned long,
|
|
|
|
NEIGH_VAR(&arp_tbl.parms, DELAY_PROBE_TIME),
|
|
|
|
NEIGH_VAR(&nd_tbl.parms, DELAY_PROBE_TIME));
|
2017-07-24 15:56:00 +08:00
|
|
|
#else
|
|
|
|
interval = NEIGH_VAR(&arp_tbl.parms, DELAY_PROBE_TIME);
|
|
|
|
#endif
|
2017-05-17 01:38:25 +08:00
|
|
|
mlxsw_sp->router->neighs_update.interval = jiffies_to_msecs(interval);
|
2016-07-05 17:27:43 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
static void mlxsw_sp_router_neigh_ent_ipv4_process(struct mlxsw_sp *mlxsw_sp,
|
|
|
|
char *rauhtd_pl,
|
|
|
|
int ent_index)
|
|
|
|
{
|
|
|
|
struct net_device *dev;
|
|
|
|
struct neighbour *n;
|
|
|
|
__be32 dipn;
|
|
|
|
u32 dip;
|
|
|
|
u16 rif;
|
|
|
|
|
|
|
|
mlxsw_reg_rauhtd_ent_ipv4_unpack(rauhtd_pl, ent_index, &rif, &dip);
|
|
|
|
|
2017-05-17 01:38:27 +08:00
|
|
|
if (!mlxsw_sp->router->rifs[rif]) {
|
2016-07-05 17:27:43 +08:00
|
|
|
dev_err_ratelimited(mlxsw_sp->bus_info->dev, "Incorrect RIF in neighbour entry\n");
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
|
|
|
|
dipn = htonl(dip);
|
2017-05-17 01:38:27 +08:00
|
|
|
dev = mlxsw_sp->router->rifs[rif]->dev;
|
2016-07-05 17:27:43 +08:00
|
|
|
n = neigh_lookup(&arp_tbl, &dipn, dev);
|
2018-01-24 17:02:09 +08:00
|
|
|
if (!n)
|
2016-07-05 17:27:43 +08:00
|
|
|
return;
|
|
|
|
|
|
|
|
netdev_dbg(dev, "Updating neighbour with IP=%pI4h\n", &dip);
|
|
|
|
neigh_event_send(n, NULL);
|
|
|
|
neigh_release(n);
|
|
|
|
}
|
|
|
|
|
2017-08-15 15:10:33 +08:00
|
|
|
#if IS_ENABLED(CONFIG_IPV6)
/* Process one IPv6 record of a RAUHTD dump: unpack its RIF and destination
 * IP, look up the matching kernel neighbour on the RIF's netdevice and send a
 * neighbour event for it. Records with an unknown RIF are logged and skipped;
 * records without a kernel neighbour are skipped silently.
 */
static void mlxsw_sp_router_neigh_ent_ipv6_process(struct mlxsw_sp *mlxsw_sp,
						   char *rauhtd_pl,
						   int rec_index)
{
	struct mlxsw_sp_rif *neigh_rif;
	struct neighbour *neigh;
	struct net_device *dev;
	struct in6_addr dip;
	u16 rif;

	mlxsw_reg_rauhtd_ent_ipv6_unpack(rauhtd_pl, rec_index, &rif,
					 (char *) &dip);

	neigh_rif = mlxsw_sp->router->rifs[rif];
	if (!neigh_rif) {
		dev_err_ratelimited(mlxsw_sp->bus_info->dev, "Incorrect RIF in neighbour entry\n");
		return;
	}

	dev = neigh_rif->dev;
	neigh = neigh_lookup(&nd_tbl, &dip, dev);
	if (!neigh)
		return;

	netdev_dbg(dev, "Updating neighbour with IP=%pI6c\n", &dip);
	neigh_event_send(neigh, NULL);
	/* Drop the reference taken by neigh_lookup(). */
	neigh_release(neigh);
}
#else
/* Without IPv6 support there is nothing to process. */
static void mlxsw_sp_router_neigh_ent_ipv6_process(struct mlxsw_sp *mlxsw_sp,
						   char *rauhtd_pl,
						   int rec_index)
{
}
#endif
|
2017-07-18 16:10:17 +08:00
|
|
|
|
2016-07-05 17:27:43 +08:00
|
|
|
static void mlxsw_sp_router_neigh_rec_ipv4_process(struct mlxsw_sp *mlxsw_sp,
|
|
|
|
char *rauhtd_pl,
|
|
|
|
int rec_index)
|
|
|
|
{
|
|
|
|
u8 num_entries;
|
|
|
|
int i;
|
|
|
|
|
|
|
|
num_entries = mlxsw_reg_rauhtd_ipv4_rec_num_entries_get(rauhtd_pl,
|
|
|
|
rec_index);
|
|
|
|
/* Hardware starts counting at 0, so add 1. */
|
|
|
|
num_entries++;
|
|
|
|
|
|
|
|
/* Each record consists of several neighbour entries. */
|
|
|
|
for (i = 0; i < num_entries; i++) {
|
|
|
|
int ent_index;
|
|
|
|
|
|
|
|
ent_index = rec_index * MLXSW_REG_RAUHTD_IPV4_ENT_PER_REC + i;
|
|
|
|
mlxsw_sp_router_neigh_ent_ipv4_process(mlxsw_sp, rauhtd_pl,
|
|
|
|
ent_index);
|
|
|
|
}
|
|
|
|
|
|
|
|
}
|
|
|
|
|
2017-07-18 16:10:17 +08:00
|
|
|
/* Process one IPv6 RAUHTD record. */
static void mlxsw_sp_router_neigh_rec_ipv6_process(struct mlxsw_sp *mlxsw_sp,
						   char *rauhtd_pl,
						   int rec_index)
{
	/* One record contains one entry, so the record index is passed on
	 * as is.
	 */
	mlxsw_sp_router_neigh_ent_ipv6_process(mlxsw_sp, rauhtd_pl, rec_index);
}
|
|
|
|
|
2016-07-05 17:27:43 +08:00
|
|
|
static void mlxsw_sp_router_neigh_rec_process(struct mlxsw_sp *mlxsw_sp,
|
|
|
|
char *rauhtd_pl, int rec_index)
|
|
|
|
{
|
|
|
|
switch (mlxsw_reg_rauhtd_rec_type_get(rauhtd_pl, rec_index)) {
|
|
|
|
case MLXSW_REG_RAUHTD_TYPE_IPV4:
|
|
|
|
mlxsw_sp_router_neigh_rec_ipv4_process(mlxsw_sp, rauhtd_pl,
|
|
|
|
rec_index);
|
|
|
|
break;
|
|
|
|
case MLXSW_REG_RAUHTD_TYPE_IPV6:
|
2017-07-18 16:10:17 +08:00
|
|
|
mlxsw_sp_router_neigh_rec_ipv6_process(mlxsw_sp, rauhtd_pl,
|
|
|
|
rec_index);
|
2016-07-05 17:27:43 +08:00
|
|
|
break;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2016-11-11 23:34:26 +08:00
|
|
|
static bool mlxsw_sp_router_rauhtd_is_full(char *rauhtd_pl)
|
|
|
|
{
|
|
|
|
u8 num_rec, last_rec_index, num_entries;
|
|
|
|
|
|
|
|
num_rec = mlxsw_reg_rauhtd_num_rec_get(rauhtd_pl);
|
|
|
|
last_rec_index = num_rec - 1;
|
|
|
|
|
|
|
|
if (num_rec < MLXSW_REG_RAUHTD_REC_MAX_NUM)
|
|
|
|
return false;
|
|
|
|
if (mlxsw_reg_rauhtd_rec_type_get(rauhtd_pl, last_rec_index) ==
|
|
|
|
MLXSW_REG_RAUHTD_TYPE_IPV6)
|
|
|
|
return true;
|
|
|
|
|
|
|
|
num_entries = mlxsw_reg_rauhtd_ipv4_rec_num_entries_get(rauhtd_pl,
|
|
|
|
last_rec_index);
|
|
|
|
if (++num_entries == MLXSW_REG_RAUHTD_IPV4_ENT_PER_REC)
|
|
|
|
return true;
|
|
|
|
return false;
|
|
|
|
}
|
|
|
|
|
2017-07-18 16:10:17 +08:00
|
|
|
static int
|
|
|
|
__mlxsw_sp_router_neighs_update_rauhtd(struct mlxsw_sp *mlxsw_sp,
|
|
|
|
char *rauhtd_pl,
|
|
|
|
enum mlxsw_reg_rauhtd_type type)
|
2016-07-05 17:27:43 +08:00
|
|
|
{
|
2017-07-18 16:10:17 +08:00
|
|
|
int i, num_rec;
|
|
|
|
int err;
|
2016-07-05 17:27:43 +08:00
|
|
|
|
|
|
|
rtnl_lock();
|
2020-02-22 01:54:10 +08:00
|
|
|
/* Ensure the RIF we read from the device does not change mid-dump. */
|
|
|
|
mutex_lock(&mlxsw_sp->router->lock);
|
2016-07-05 17:27:43 +08:00
|
|
|
do {
|
2017-07-18 16:10:17 +08:00
|
|
|
mlxsw_reg_rauhtd_pack(rauhtd_pl, type);
|
2016-07-05 17:27:43 +08:00
|
|
|
err = mlxsw_reg_query(mlxsw_sp->core, MLXSW_REG(rauhtd),
|
|
|
|
rauhtd_pl);
|
|
|
|
if (err) {
|
2017-10-02 18:21:57 +08:00
|
|
|
dev_err_ratelimited(mlxsw_sp->bus_info->dev, "Failed to dump neighbour table\n");
|
2016-07-05 17:27:43 +08:00
|
|
|
break;
|
|
|
|
}
|
|
|
|
num_rec = mlxsw_reg_rauhtd_num_rec_get(rauhtd_pl);
|
|
|
|
for (i = 0; i < num_rec; i++)
|
|
|
|
mlxsw_sp_router_neigh_rec_process(mlxsw_sp, rauhtd_pl,
|
|
|
|
i);
|
2016-11-11 23:34:26 +08:00
|
|
|
} while (mlxsw_sp_router_rauhtd_is_full(rauhtd_pl));
|
2020-02-22 01:54:10 +08:00
|
|
|
mutex_unlock(&mlxsw_sp->router->lock);
|
2016-07-05 17:27:43 +08:00
|
|
|
rtnl_unlock();
|
|
|
|
|
2017-07-18 16:10:17 +08:00
|
|
|
return err;
|
|
|
|
}
|
|
|
|
|
|
|
|
static int mlxsw_sp_router_neighs_update_rauhtd(struct mlxsw_sp *mlxsw_sp)
|
|
|
|
{
|
|
|
|
enum mlxsw_reg_rauhtd_type type;
|
|
|
|
char *rauhtd_pl;
|
|
|
|
int err;
|
|
|
|
|
|
|
|
rauhtd_pl = kmalloc(MLXSW_REG_RAUHTD_LEN, GFP_KERNEL);
|
|
|
|
if (!rauhtd_pl)
|
|
|
|
return -ENOMEM;
|
|
|
|
|
|
|
|
type = MLXSW_REG_RAUHTD_TYPE_IPV4;
|
|
|
|
err = __mlxsw_sp_router_neighs_update_rauhtd(mlxsw_sp, rauhtd_pl, type);
|
|
|
|
if (err)
|
|
|
|
goto out;
|
|
|
|
|
|
|
|
type = MLXSW_REG_RAUHTD_TYPE_IPV6;
|
|
|
|
err = __mlxsw_sp_router_neighs_update_rauhtd(mlxsw_sp, rauhtd_pl, type);
|
|
|
|
out:
|
2016-07-05 17:27:43 +08:00
|
|
|
kfree(rauhtd_pl);
|
2016-07-05 17:27:51 +08:00
|
|
|
return err;
|
|
|
|
}
|
|
|
|
|
|
|
|
static void mlxsw_sp_router_neighs_update_nh(struct mlxsw_sp *mlxsw_sp)
|
|
|
|
{
|
|
|
|
struct mlxsw_sp_neigh_entry *neigh_entry;
|
|
|
|
|
|
|
|
rtnl_lock();
|
2020-02-22 01:54:10 +08:00
|
|
|
mutex_lock(&mlxsw_sp->router->lock);
|
2017-05-17 01:38:25 +08:00
|
|
|
list_for_each_entry(neigh_entry, &mlxsw_sp->router->nexthop_neighs_list,
|
2017-02-06 23:20:15 +08:00
|
|
|
nexthop_neighs_list_node)
|
2016-07-05 17:27:51 +08:00
|
|
|
/* If this neigh have nexthops, make the kernel think this neigh
|
|
|
|
* is active regardless of the traffic.
|
|
|
|
*/
|
2017-02-06 23:20:15 +08:00
|
|
|
neigh_event_send(neigh_entry->key.n, NULL);
|
2020-02-22 01:54:10 +08:00
|
|
|
mutex_unlock(&mlxsw_sp->router->lock);
|
2016-07-05 17:27:51 +08:00
|
|
|
rtnl_unlock();
|
|
|
|
}
|
|
|
|
|
|
|
|
static void
|
|
|
|
mlxsw_sp_router_neighs_update_work_schedule(struct mlxsw_sp *mlxsw_sp)
|
|
|
|
{
|
2017-05-17 01:38:25 +08:00
|
|
|
unsigned long interval = mlxsw_sp->router->neighs_update.interval;
|
2016-07-05 17:27:51 +08:00
|
|
|
|
2017-05-17 01:38:25 +08:00
|
|
|
mlxsw_core_schedule_dw(&mlxsw_sp->router->neighs_update.dw,
|
2016-07-05 17:27:51 +08:00
|
|
|
msecs_to_jiffies(interval));
|
|
|
|
}
|
|
|
|
|
|
|
|
static void mlxsw_sp_router_neighs_update_work(struct work_struct *work)
|
|
|
|
{
|
2017-05-17 01:38:25 +08:00
|
|
|
struct mlxsw_sp_router *router;
|
2016-07-05 17:27:51 +08:00
|
|
|
int err;
|
|
|
|
|
2017-05-17 01:38:25 +08:00
|
|
|
router = container_of(work, struct mlxsw_sp_router,
|
|
|
|
neighs_update.dw.work);
|
|
|
|
err = mlxsw_sp_router_neighs_update_rauhtd(router->mlxsw_sp);
|
2016-07-05 17:27:51 +08:00
|
|
|
if (err)
|
2017-05-17 01:38:25 +08:00
|
|
|
dev_err(router->mlxsw_sp->bus_info->dev, "Could not update kernel for neigh activity");
|
2016-07-05 17:27:51 +08:00
|
|
|
|
2017-05-17 01:38:25 +08:00
|
|
|
mlxsw_sp_router_neighs_update_nh(router->mlxsw_sp);
|
2016-07-05 17:27:51 +08:00
|
|
|
|
2017-05-17 01:38:25 +08:00
|
|
|
mlxsw_sp_router_neighs_update_work_schedule(router->mlxsw_sp);
|
2016-07-05 17:27:43 +08:00
|
|
|
}
|
|
|
|
|
2016-07-05 17:27:52 +08:00
|
|
|
static void mlxsw_sp_router_probe_unresolved_nexthops(struct work_struct *work)
|
|
|
|
{
|
|
|
|
struct mlxsw_sp_neigh_entry *neigh_entry;
|
2017-05-17 01:38:25 +08:00
|
|
|
struct mlxsw_sp_router *router;
|
2016-07-05 17:27:52 +08:00
|
|
|
|
2017-05-17 01:38:25 +08:00
|
|
|
router = container_of(work, struct mlxsw_sp_router,
|
|
|
|
nexthop_probe_dw.work);
|
2016-07-05 17:27:52 +08:00
|
|
|
/* Iterate over nexthop neighbours, find those who are unresolved and
|
|
|
|
* send arp on them. This solves the chicken-egg problem when
|
|
|
|
* the nexthop wouldn't get offloaded until the neighbor is resolved
|
|
|
|
* but it wouldn't get resolved ever in case traffic is flowing in HW
|
|
|
|
* using different nexthop.
|
|
|
|
*/
|
|
|
|
rtnl_lock();
|
2020-02-22 01:54:10 +08:00
|
|
|
mutex_lock(&router->lock);
|
2017-05-17 01:38:25 +08:00
|
|
|
list_for_each_entry(neigh_entry, &router->nexthop_neighs_list,
|
2017-02-06 23:20:15 +08:00
|
|
|
nexthop_neighs_list_node)
|
2017-02-06 23:20:16 +08:00
|
|
|
if (!neigh_entry->connected)
|
2016-11-10 19:31:04 +08:00
|
|
|
neigh_event_send(neigh_entry->key.n, NULL);
|
2020-02-22 01:54:10 +08:00
|
|
|
mutex_unlock(&router->lock);
|
2016-07-05 17:27:52 +08:00
|
|
|
rtnl_unlock();
|
|
|
|
|
2017-05-17 01:38:25 +08:00
|
|
|
mlxsw_core_schedule_dw(&router->nexthop_probe_dw,
|
2016-07-05 17:27:52 +08:00
|
|
|
MLXSW_SP_UNRESOLVED_NH_PROBE_INTERVAL);
|
|
|
|
}
|
|
|
|
|
2016-07-05 17:27:50 +08:00
|
|
|
static void
|
|
|
|
mlxsw_sp_nexthop_neigh_update(struct mlxsw_sp *mlxsw_sp,
|
|
|
|
struct mlxsw_sp_neigh_entry *neigh_entry,
|
2019-06-11 15:19:41 +08:00
|
|
|
bool removing, bool dead);
|
2016-07-05 17:27:50 +08:00
|
|
|
|
2017-02-06 23:20:13 +08:00
|
|
|
/* Map the adding flag to the RAUHT register operation: write-add when true,
 * write-delete when false.
 */
static enum mlxsw_reg_rauht_op mlxsw_sp_rauht_op(bool adding)
{
	if (adding)
		return MLXSW_REG_RAUHT_OP_WRITE_ADD;

	return MLXSW_REG_RAUHT_OP_WRITE_DELETE;
}
|
|
|
|
|
2019-04-15 02:57:47 +08:00
|
|
|
static int
|
2017-02-06 23:20:13 +08:00
|
|
|
mlxsw_sp_router_neigh_entry_op4(struct mlxsw_sp *mlxsw_sp,
|
|
|
|
struct mlxsw_sp_neigh_entry *neigh_entry,
|
|
|
|
enum mlxsw_reg_rauht_op op)
|
2016-07-05 17:27:44 +08:00
|
|
|
{
|
2016-11-10 19:31:04 +08:00
|
|
|
struct neighbour *n = neigh_entry->key.n;
|
2017-02-06 23:20:13 +08:00
|
|
|
u32 dip = ntohl(*((__be32 *) n->primary_key));
|
2016-07-05 17:27:44 +08:00
|
|
|
char rauht_pl[MLXSW_REG_RAUHT_LEN];
|
2017-02-06 23:20:13 +08:00
|
|
|
|
|
|
|
mlxsw_reg_rauht_pack4(rauht_pl, op, neigh_entry->rif, neigh_entry->ha,
|
|
|
|
dip);
|
2017-08-24 14:40:08 +08:00
|
|
|
if (neigh_entry->counter_valid)
|
|
|
|
mlxsw_reg_rauht_pack_counter(rauht_pl,
|
|
|
|
neigh_entry->counter_index);
|
2019-04-15 02:57:47 +08:00
|
|
|
return mlxsw_reg_write(mlxsw_sp->core, MLXSW_REG(rauht), rauht_pl);
|
2017-02-06 23:20:13 +08:00
|
|
|
}
|
|
|
|
|
2019-04-15 02:57:47 +08:00
|
|
|
static int
|
2017-07-18 16:10:15 +08:00
|
|
|
mlxsw_sp_router_neigh_entry_op6(struct mlxsw_sp *mlxsw_sp,
|
|
|
|
struct mlxsw_sp_neigh_entry *neigh_entry,
|
|
|
|
enum mlxsw_reg_rauht_op op)
|
|
|
|
{
|
|
|
|
struct neighbour *n = neigh_entry->key.n;
|
|
|
|
char rauht_pl[MLXSW_REG_RAUHT_LEN];
|
|
|
|
const char *dip = n->primary_key;
|
|
|
|
|
|
|
|
mlxsw_reg_rauht_pack6(rauht_pl, op, neigh_entry->rif, neigh_entry->ha,
|
|
|
|
dip);
|
2017-08-24 14:40:08 +08:00
|
|
|
if (neigh_entry->counter_valid)
|
|
|
|
mlxsw_reg_rauht_pack_counter(rauht_pl,
|
|
|
|
neigh_entry->counter_index);
|
2019-04-15 02:57:47 +08:00
|
|
|
return mlxsw_reg_write(mlxsw_sp->core, MLXSW_REG(rauht), rauht_pl);
|
2017-07-18 16:10:15 +08:00
|
|
|
}
|
|
|
|
|
2017-08-31 23:59:13 +08:00
|
|
|
bool mlxsw_sp_neigh_ipv6_ignore(struct mlxsw_sp_neigh_entry *neigh_entry)
|
2017-07-18 16:10:15 +08:00
|
|
|
{
|
2017-08-31 23:59:13 +08:00
|
|
|
struct neighbour *n = neigh_entry->key.n;
|
|
|
|
|
2017-07-18 16:10:15 +08:00
|
|
|
/* Packets with a link-local destination address are trapped
|
|
|
|
* after LPM lookup and never reach the neighbour table, so
|
|
|
|
* there is no need to program such neighbours to the device.
|
|
|
|
*/
|
|
|
|
if (ipv6_addr_type((struct in6_addr *) &n->primary_key) &
|
|
|
|
IPV6_ADDR_LINKLOCAL)
|
|
|
|
return true;
|
|
|
|
return false;
|
|
|
|
}
|
|
|
|
|
2017-02-06 23:20:13 +08:00
|
|
|
static void
|
|
|
|
mlxsw_sp_neigh_entry_update(struct mlxsw_sp *mlxsw_sp,
|
|
|
|
struct mlxsw_sp_neigh_entry *neigh_entry,
|
|
|
|
bool adding)
|
|
|
|
{
|
2019-04-15 02:57:47 +08:00
|
|
|
enum mlxsw_reg_rauht_op op = mlxsw_sp_rauht_op(adding);
|
|
|
|
int err;
|
|
|
|
|
2017-02-06 23:20:13 +08:00
|
|
|
if (!adding && !neigh_entry->connected)
|
|
|
|
return;
|
|
|
|
neigh_entry->connected = adding;
|
2017-07-24 15:56:00 +08:00
|
|
|
if (neigh_entry->key.n->tbl->family == AF_INET) {
|
2019-04-15 02:57:47 +08:00
|
|
|
err = mlxsw_sp_router_neigh_entry_op4(mlxsw_sp, neigh_entry,
|
|
|
|
op);
|
|
|
|
if (err)
|
|
|
|
return;
|
2017-07-24 15:56:00 +08:00
|
|
|
} else if (neigh_entry->key.n->tbl->family == AF_INET6) {
|
2017-08-31 23:59:13 +08:00
|
|
|
if (mlxsw_sp_neigh_ipv6_ignore(neigh_entry))
|
2017-07-18 16:10:15 +08:00
|
|
|
return;
|
2019-04-15 02:57:47 +08:00
|
|
|
err = mlxsw_sp_router_neigh_entry_op6(mlxsw_sp, neigh_entry,
|
|
|
|
op);
|
|
|
|
if (err)
|
|
|
|
return;
|
2017-07-18 16:10:15 +08:00
|
|
|
} else {
|
2017-02-06 23:20:13 +08:00
|
|
|
WARN_ON_ONCE(1);
|
2019-04-15 02:57:49 +08:00
|
|
|
return;
|
2017-07-18 16:10:15 +08:00
|
|
|
}
|
2019-04-15 02:57:49 +08:00
|
|
|
|
|
|
|
if (adding)
|
|
|
|
neigh_entry->key.n->flags |= NTF_OFFLOADED;
|
|
|
|
else
|
|
|
|
neigh_entry->key.n->flags &= ~NTF_OFFLOADED;
|
2017-02-06 23:20:13 +08:00
|
|
|
}
|
|
|
|
|
2017-08-24 14:40:10 +08:00
|
|
|
void
|
|
|
|
mlxsw_sp_neigh_entry_counter_update(struct mlxsw_sp *mlxsw_sp,
|
|
|
|
struct mlxsw_sp_neigh_entry *neigh_entry,
|
|
|
|
bool adding)
|
|
|
|
{
|
|
|
|
if (adding)
|
|
|
|
mlxsw_sp_neigh_counter_alloc(mlxsw_sp, neigh_entry);
|
|
|
|
else
|
|
|
|
mlxsw_sp_neigh_counter_free(mlxsw_sp, neigh_entry);
|
|
|
|
mlxsw_sp_neigh_entry_update(mlxsw_sp, neigh_entry, true);
|
|
|
|
}
|
|
|
|
|
2017-11-03 00:14:07 +08:00
|
|
|
struct mlxsw_sp_netevent_work {
|
2017-02-06 23:20:13 +08:00
|
|
|
struct work_struct work;
|
|
|
|
struct mlxsw_sp *mlxsw_sp;
|
|
|
|
struct neighbour *n;
|
|
|
|
};
|
|
|
|
|
|
|
|
static void mlxsw_sp_router_neigh_event_work(struct work_struct *work)
|
|
|
|
{
|
2017-11-03 00:14:07 +08:00
|
|
|
struct mlxsw_sp_netevent_work *net_work =
|
|
|
|
container_of(work, struct mlxsw_sp_netevent_work, work);
|
|
|
|
struct mlxsw_sp *mlxsw_sp = net_work->mlxsw_sp;
|
2017-02-06 23:20:13 +08:00
|
|
|
struct mlxsw_sp_neigh_entry *neigh_entry;
|
2017-11-03 00:14:07 +08:00
|
|
|
struct neighbour *n = net_work->n;
|
2017-02-06 23:20:13 +08:00
|
|
|
unsigned char ha[ETH_ALEN];
|
2016-07-05 17:27:44 +08:00
|
|
|
bool entry_connected;
|
2016-12-23 16:32:49 +08:00
|
|
|
u8 nud_state, dead;
|
2016-07-05 17:27:44 +08:00
|
|
|
|
2017-02-06 23:20:13 +08:00
|
|
|
/* If these parameters are changed after we release the lock,
|
|
|
|
* then we are guaranteed to receive another event letting us
|
|
|
|
* know about it.
|
|
|
|
*/
|
2016-07-05 17:27:44 +08:00
|
|
|
read_lock_bh(&n->lock);
|
2017-02-06 23:20:13 +08:00
|
|
|
memcpy(ha, n->ha, ETH_ALEN);
|
2016-07-05 17:27:44 +08:00
|
|
|
nud_state = n->nud_state;
|
2016-12-23 16:32:49 +08:00
|
|
|
dead = n->dead;
|
2016-07-05 17:27:44 +08:00
|
|
|
read_unlock_bh(&n->lock);
|
|
|
|
|
2017-02-06 23:20:13 +08:00
|
|
|
rtnl_lock();
|
2020-02-22 01:54:10 +08:00
|
|
|
mutex_lock(&mlxsw_sp->router->lock);
|
2018-02-27 21:53:46 +08:00
|
|
|
mlxsw_sp_span_respin(mlxsw_sp);
|
|
|
|
|
2016-12-23 16:32:49 +08:00
|
|
|
entry_connected = nud_state & NUD_VALID && !dead;
|
2017-02-06 23:20:13 +08:00
|
|
|
neigh_entry = mlxsw_sp_neigh_entry_lookup(mlxsw_sp, n);
|
|
|
|
if (!entry_connected && !neigh_entry)
|
|
|
|
goto out;
|
|
|
|
if (!neigh_entry) {
|
|
|
|
neigh_entry = mlxsw_sp_neigh_entry_create(mlxsw_sp, n);
|
|
|
|
if (IS_ERR(neigh_entry))
|
|
|
|
goto out;
|
2016-07-05 17:27:44 +08:00
|
|
|
}
|
|
|
|
|
2017-02-06 23:20:13 +08:00
|
|
|
memcpy(neigh_entry->ha, ha, ETH_ALEN);
|
|
|
|
mlxsw_sp_neigh_entry_update(mlxsw_sp, neigh_entry, entry_connected);
|
2019-06-11 15:19:41 +08:00
|
|
|
mlxsw_sp_nexthop_neigh_update(mlxsw_sp, neigh_entry, !entry_connected,
|
|
|
|
dead);
|
2017-02-06 23:20:13 +08:00
|
|
|
|
|
|
|
if (!neigh_entry->connected && list_empty(&neigh_entry->nexthop_list))
|
|
|
|
mlxsw_sp_neigh_entry_destroy(mlxsw_sp, neigh_entry);
|
|
|
|
|
|
|
|
out:
|
2020-02-22 01:54:10 +08:00
|
|
|
mutex_unlock(&mlxsw_sp->router->lock);
|
2017-02-06 23:20:13 +08:00
|
|
|
rtnl_unlock();
|
2016-07-05 17:27:44 +08:00
|
|
|
neigh_release(n);
|
2017-11-03 00:14:07 +08:00
|
|
|
kfree(net_work);
|
2016-07-05 17:27:44 +08:00
|
|
|
}
|
|
|
|
|
2017-11-03 00:14:10 +08:00
|
|
|
static int mlxsw_sp_mp_hash_init(struct mlxsw_sp *mlxsw_sp);
|
|
|
|
|
|
|
|
static void mlxsw_sp_router_mp_hash_event_work(struct work_struct *work)
|
|
|
|
{
|
|
|
|
struct mlxsw_sp_netevent_work *net_work =
|
|
|
|
container_of(work, struct mlxsw_sp_netevent_work, work);
|
|
|
|
struct mlxsw_sp *mlxsw_sp = net_work->mlxsw_sp;
|
|
|
|
|
|
|
|
mlxsw_sp_mp_hash_init(mlxsw_sp);
|
|
|
|
kfree(net_work);
|
|
|
|
}
|
|
|
|
|
2018-08-01 06:38:03 +08:00
|
|
|
static int __mlxsw_sp_router_init(struct mlxsw_sp *mlxsw_sp);
|
|
|
|
|
|
|
|
static void mlxsw_sp_router_update_priority_work(struct work_struct *work)
|
|
|
|
{
|
|
|
|
struct mlxsw_sp_netevent_work *net_work =
|
|
|
|
container_of(work, struct mlxsw_sp_netevent_work, work);
|
|
|
|
struct mlxsw_sp *mlxsw_sp = net_work->mlxsw_sp;
|
|
|
|
|
|
|
|
__mlxsw_sp_router_init(mlxsw_sp);
|
|
|
|
kfree(net_work);
|
|
|
|
}
|
|
|
|
|
2018-08-01 06:37:36 +08:00
|
|
|
static int mlxsw_sp_router_schedule_work(struct net *net,
|
|
|
|
struct notifier_block *nb,
|
|
|
|
void (*cb)(struct work_struct *))
|
|
|
|
{
|
|
|
|
struct mlxsw_sp_netevent_work *net_work;
|
|
|
|
struct mlxsw_sp_router *router;
|
|
|
|
|
2019-10-03 17:49:32 +08:00
|
|
|
router = container_of(nb, struct mlxsw_sp_router, netevent_nb);
|
|
|
|
if (!net_eq(net, mlxsw_sp_net(router->mlxsw_sp)))
|
2018-08-01 06:37:36 +08:00
|
|
|
return NOTIFY_DONE;
|
|
|
|
|
|
|
|
net_work = kzalloc(sizeof(*net_work), GFP_ATOMIC);
|
|
|
|
if (!net_work)
|
|
|
|
return NOTIFY_BAD;
|
|
|
|
|
|
|
|
INIT_WORK(&net_work->work, cb);
|
|
|
|
net_work->mlxsw_sp = router->mlxsw_sp;
|
|
|
|
mlxsw_core_schedule_work(&net_work->work);
|
|
|
|
return NOTIFY_DONE;
|
|
|
|
}
|
|
|
|
|
2017-11-03 00:14:10 +08:00
|
|
|
static int mlxsw_sp_router_netevent_event(struct notifier_block *nb,
|
2017-11-03 00:14:06 +08:00
|
|
|
unsigned long event, void *ptr)
|
2016-07-05 17:27:43 +08:00
|
|
|
{
|
2017-11-03 00:14:07 +08:00
|
|
|
struct mlxsw_sp_netevent_work *net_work;
|
2016-07-05 17:27:43 +08:00
|
|
|
struct mlxsw_sp_port *mlxsw_sp_port;
|
|
|
|
struct mlxsw_sp *mlxsw_sp;
|
|
|
|
unsigned long interval;
|
|
|
|
struct neigh_parms *p;
|
2016-07-05 17:27:44 +08:00
|
|
|
struct neighbour *n;
|
2016-07-05 17:27:43 +08:00
|
|
|
|
|
|
|
switch (event) {
|
|
|
|
case NETEVENT_DELAY_PROBE_TIME_UPDATE:
|
|
|
|
p = ptr;
|
|
|
|
|
|
|
|
/* We don't care about changes in the default table. */
|
2017-07-24 15:56:00 +08:00
|
|
|
if (!p->dev || (p->tbl->family != AF_INET &&
|
|
|
|
p->tbl->family != AF_INET6))
|
2016-07-05 17:27:43 +08:00
|
|
|
return NOTIFY_DONE;
|
|
|
|
|
|
|
|
/* We are in atomic context and can't take RTNL mutex,
|
|
|
|
* so use RCU variant to walk the device chain.
|
|
|
|
*/
|
|
|
|
mlxsw_sp_port = mlxsw_sp_port_lower_dev_hold(p->dev);
|
|
|
|
if (!mlxsw_sp_port)
|
|
|
|
return NOTIFY_DONE;
|
|
|
|
|
|
|
|
mlxsw_sp = mlxsw_sp_port->mlxsw_sp;
|
|
|
|
interval = jiffies_to_msecs(NEIGH_VAR(p, DELAY_PROBE_TIME));
|
2017-05-17 01:38:25 +08:00
|
|
|
mlxsw_sp->router->neighs_update.interval = interval;
|
2016-07-05 17:27:43 +08:00
|
|
|
|
|
|
|
mlxsw_sp_port_dev_put(mlxsw_sp_port);
|
|
|
|
break;
|
2016-07-05 17:27:44 +08:00
|
|
|
case NETEVENT_NEIGH_UPDATE:
|
|
|
|
n = ptr;
|
|
|
|
|
2017-07-24 15:56:00 +08:00
|
|
|
if (n->tbl->family != AF_INET && n->tbl->family != AF_INET6)
|
2016-07-05 17:27:44 +08:00
|
|
|
return NOTIFY_DONE;
|
|
|
|
|
2017-02-06 23:20:13 +08:00
|
|
|
mlxsw_sp_port = mlxsw_sp_port_lower_dev_hold(n->dev);
|
2016-07-05 17:27:44 +08:00
|
|
|
if (!mlxsw_sp_port)
|
|
|
|
return NOTIFY_DONE;
|
|
|
|
|
2017-11-03 00:14:07 +08:00
|
|
|
net_work = kzalloc(sizeof(*net_work), GFP_ATOMIC);
|
|
|
|
if (!net_work) {
|
2016-07-05 17:27:44 +08:00
|
|
|
mlxsw_sp_port_dev_put(mlxsw_sp_port);
|
2017-02-06 23:20:13 +08:00
|
|
|
return NOTIFY_BAD;
|
2016-07-05 17:27:44 +08:00
|
|
|
}
|
2017-02-06 23:20:13 +08:00
|
|
|
|
2017-11-03 00:14:07 +08:00
|
|
|
INIT_WORK(&net_work->work, mlxsw_sp_router_neigh_event_work);
|
|
|
|
net_work->mlxsw_sp = mlxsw_sp_port->mlxsw_sp;
|
|
|
|
net_work->n = n;
|
2016-07-05 17:27:44 +08:00
|
|
|
|
|
|
|
/* Take a reference to ensure the neighbour won't be
|
|
|
|
* destructed until we drop the reference in delayed
|
|
|
|
* work.
|
|
|
|
*/
|
|
|
|
neigh_clone(n);
|
2017-11-03 00:14:07 +08:00
|
|
|
mlxsw_core_schedule_work(&net_work->work);
|
2017-02-06 23:20:13 +08:00
|
|
|
mlxsw_sp_port_dev_put(mlxsw_sp_port);
|
2016-07-05 17:27:44 +08:00
|
|
|
break;
|
2018-03-03 00:32:16 +08:00
|
|
|
case NETEVENT_IPV4_MPATH_HASH_UPDATE:
|
2018-03-03 00:32:19 +08:00
|
|
|
case NETEVENT_IPV6_MPATH_HASH_UPDATE:
|
2018-08-01 06:37:36 +08:00
|
|
|
return mlxsw_sp_router_schedule_work(ptr, nb,
|
|
|
|
mlxsw_sp_router_mp_hash_event_work);
|
2017-11-03 00:14:10 +08:00
|
|
|
|
2018-08-01 06:38:03 +08:00
|
|
|
case NETEVENT_IPV4_FWD_UPDATE_PRIORITY_UPDATE:
|
|
|
|
return mlxsw_sp_router_schedule_work(ptr, nb,
|
|
|
|
mlxsw_sp_router_update_priority_work);
|
2016-07-05 17:27:43 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
return NOTIFY_DONE;
|
|
|
|
}
|
|
|
|
|
2016-07-05 17:27:39 +08:00
|
|
|
static int mlxsw_sp_neigh_init(struct mlxsw_sp *mlxsw_sp)
|
|
|
|
{
|
2016-07-05 17:27:43 +08:00
|
|
|
int err;
|
|
|
|
|
2017-05-17 01:38:25 +08:00
|
|
|
err = rhashtable_init(&mlxsw_sp->router->neigh_ht,
|
2016-07-05 17:27:43 +08:00
|
|
|
&mlxsw_sp_neigh_ht_params);
|
|
|
|
if (err)
|
|
|
|
return err;
|
|
|
|
|
|
|
|
/* Initialize the polling interval according to the default
|
|
|
|
* table.
|
|
|
|
*/
|
|
|
|
mlxsw_sp_router_neighs_update_interval_init(mlxsw_sp);
|
|
|
|
|
2016-07-05 17:27:52 +08:00
|
|
|
/* Create the delayed works for the activity_update */
|
2017-05-17 01:38:25 +08:00
|
|
|
INIT_DELAYED_WORK(&mlxsw_sp->router->neighs_update.dw,
|
2016-07-05 17:27:43 +08:00
|
|
|
mlxsw_sp_router_neighs_update_work);
|
2017-05-17 01:38:25 +08:00
|
|
|
INIT_DELAYED_WORK(&mlxsw_sp->router->nexthop_probe_dw,
|
2016-07-05 17:27:52 +08:00
|
|
|
mlxsw_sp_router_probe_unresolved_nexthops);
|
2017-05-17 01:38:25 +08:00
|
|
|
mlxsw_core_schedule_dw(&mlxsw_sp->router->neighs_update.dw, 0);
|
|
|
|
mlxsw_core_schedule_dw(&mlxsw_sp->router->nexthop_probe_dw, 0);
|
2016-07-05 17:27:43 +08:00
|
|
|
return 0;
|
2016-07-05 17:27:39 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
static void mlxsw_sp_neigh_fini(struct mlxsw_sp *mlxsw_sp)
|
|
|
|
{
|
2017-05-17 01:38:25 +08:00
|
|
|
cancel_delayed_work_sync(&mlxsw_sp->router->neighs_update.dw);
|
|
|
|
cancel_delayed_work_sync(&mlxsw_sp->router->nexthop_probe_dw);
|
|
|
|
rhashtable_destroy(&mlxsw_sp->router->neigh_ht);
|
2016-07-05 17:27:39 +08:00
|
|
|
}
|
|
|
|
|
2017-02-08 18:16:42 +08:00
|
|
|
static void mlxsw_sp_neigh_rif_gone_sync(struct mlxsw_sp *mlxsw_sp,
|
2017-03-17 16:38:00 +08:00
|
|
|
struct mlxsw_sp_rif *rif)
|
2017-02-08 18:16:42 +08:00
|
|
|
{
|
|
|
|
struct mlxsw_sp_neigh_entry *neigh_entry, *tmp;
|
|
|
|
|
2017-03-17 16:38:00 +08:00
|
|
|
list_for_each_entry_safe(neigh_entry, tmp, &rif->neigh_list,
|
2017-12-18 00:16:43 +08:00
|
|
|
rif_list_node) {
|
|
|
|
mlxsw_sp_neigh_entry_update(mlxsw_sp, neigh_entry, false);
|
2017-02-08 18:16:42 +08:00
|
|
|
mlxsw_sp_neigh_entry_destroy(mlxsw_sp, neigh_entry);
|
2017-12-18 00:16:43 +08:00
|
|
|
}
|
2017-02-08 18:16:42 +08:00
|
|
|
}
|
|
|
|
|
mlxsw: spectrum_router: Make nexthops typed
In the router, some next hops may reference an encapsulating netdevice,
such as GRE or IPIP. To properly offload these next hops, mlxsw needs to
keep track of whether a given next hop is a regular Ethernet entry, or
an IP-in-IP tunneling entry.
To facilitate this book-keeping, add a type field to struct
mlxsw_sp_nexthop. There is, as of this patch, only one next hop type:
MLXSW_SP_NEXTHOP_TYPE_ETH. Follow-up patches will introduce the IP-in-IP
variant.
There are several places where next hops are initialized in the IPv4
path. Instead of replicating the logic at every one of them, factor it
out to a function mlxsw_sp_nexthop4_type_init(). The corresponding fini
is actually protocol-neutral, so put it to mlxsw_sp_nexthop_type_fini(),
but create a corresponding protocoled _fini function that dispatches to
the protocol-neutral one.
The IPv6 path is simpler, but for symmetry with IPv4, create the same
suite of functions with corresponding logic.
Signed-off-by: Petr Machata <petrm@mellanox.com>
Reviewed-by: Ido Schimmel <idosch@mellanox.com>
Signed-off-by: Jiri Pirko <jiri@mellanox.com>
Signed-off-by: David S. Miller <davem@davemloft.net>
2017-09-03 05:49:22 +08:00
|
|
|
/* Kind of a nexthop; selects which member of the anonymous union in
 * struct mlxsw_sp_nexthop is meaningful.
 */
enum mlxsw_sp_nexthop_type {
	MLXSW_SP_NEXTHOP_TYPE_ETH,	/* uses 'neigh_entry' */
	MLXSW_SP_NEXTHOP_TYPE_IPIP,	/* uses 'ipip_entry' */
};
|
|
|
|
|
2017-02-08 18:16:30 +08:00
|
|
|
/* Lookup key of a nexthop in the router's nexthop hash table. */
struct mlxsw_sp_nexthop_key {
	struct fib_nh *fib_nh;
};
|
|
|
|
|
2016-07-05 17:27:50 +08:00
|
|
|
struct mlxsw_sp_nexthop {
|
|
|
|
struct list_head neigh_list_node; /* member of neigh entry list */
|
2017-02-08 18:16:42 +08:00
|
|
|
struct list_head rif_list_node;
|
2017-09-25 16:32:23 +08:00
|
|
|
struct list_head router_list_node;
|
2016-07-05 17:27:50 +08:00
|
|
|
struct mlxsw_sp_nexthop_group *nh_grp; /* pointer back to the group
|
|
|
|
* this belongs to
|
|
|
|
*/
|
2017-02-08 18:16:30 +08:00
|
|
|
struct rhash_head ht_node;
|
|
|
|
struct mlxsw_sp_nexthop_key key;
|
2017-07-18 16:10:19 +08:00
|
|
|
unsigned char gw_addr[sizeof(struct in6_addr)];
|
2017-08-15 03:09:20 +08:00
|
|
|
int ifindex;
|
2017-10-23 05:11:46 +08:00
|
|
|
int nh_weight;
|
2017-10-23 05:11:48 +08:00
|
|
|
int norm_nh_weight;
|
|
|
|
int num_adj_entries;
|
2017-03-17 16:38:00 +08:00
|
|
|
struct mlxsw_sp_rif *rif;
|
2016-07-05 17:27:50 +08:00
|
|
|
u8 should_offload:1, /* set indicates this neigh is connected and
|
|
|
|
* should be put to KVD linear area of this group.
|
|
|
|
*/
|
|
|
|
offloaded:1, /* set in case the neigh is actually put into
|
|
|
|
* KVD linear area of this group.
|
|
|
|
*/
|
|
|
|
update:1; /* set indicates that MAC of this neigh should be
|
|
|
|
* updated in HW
|
|
|
|
*/
|
mlxsw: spectrum_router: Make nexthops typed
In the router, some next hops may reference an encapsulating netdevice,
such as GRE or IPIP. To properly offload these next hops, mlxsw needs to
keep track of whether a given next hop is a regular Ethernet entry, or
an IP-in-IP tunneling entry.
To facilitate this book-keeping, add a type field to struct
mlxsw_sp_nexthop. There is, as of this patch, only one next hop type:
MLXSW_SP_NEXTHOP_TYPE_ETH. Follow-up patches will introduce the IP-in-IP
variant.
There are several places where next hops are initialized in the IPv4
path. Instead of replicating the logic at every one of them, factor it
out to a function mlxsw_sp_nexthop4_type_init(). The corresponding fini
is actually protocol-neutral, so put it to mlxsw_sp_nexthop_type_fini(),
but create a corresponding protocoled _fini function that dispatches to
the protocol-neutral one.
The IPv6 path is simpler, but for symmetry with IPv4, create the same
suite of functions with corresponding logic.
Signed-off-by: Petr Machata <petrm@mellanox.com>
Reviewed-by: Ido Schimmel <idosch@mellanox.com>
Signed-off-by: Jiri Pirko <jiri@mellanox.com>
Signed-off-by: David S. Miller <davem@davemloft.net>
2017-09-03 05:49:22 +08:00
|
|
|
enum mlxsw_sp_nexthop_type type;
|
|
|
|
union {
|
|
|
|
struct mlxsw_sp_neigh_entry *neigh_entry;
|
2017-09-03 05:49:23 +08:00
|
|
|
struct mlxsw_sp_ipip_entry *ipip_entry;
|
mlxsw: spectrum_router: Make nexthops typed
In the router, some next hops may reference an encapsulating netdevice,
such as GRE or IPIP. To properly offload these next hops, mlxsw needs to
keep track of whether a given next hop is a regular Ethernet entry, or
an IP-in-IP tunneling entry.
To facilitate this book-keeping, add a type field to struct
mlxsw_sp_nexthop. There is, as of this patch, only one next hop type:
MLXSW_SP_NEXTHOP_TYPE_ETH. Follow-up patches will introduce the IP-in-IP
variant.
There are several places where next hops are initialized in the IPv4
path. Instead of replicating the logic at every one of them, factor it
out to a function mlxsw_sp_nexthop4_type_init(). The corresponding fini
is actually protocol-neutral, so put it to mlxsw_sp_nexthop_type_fini(),
but create a corresponding protocoled _fini function that dispatches to
the protocol-neutral one.
The IPv6 path is simpler, but for symmetry with IPv4, create the same
suite of functions with corresponding logic.
Signed-off-by: Petr Machata <petrm@mellanox.com>
Reviewed-by: Ido Schimmel <idosch@mellanox.com>
Signed-off-by: Jiri Pirko <jiri@mellanox.com>
Signed-off-by: David S. Miller <davem@davemloft.net>
2017-09-03 05:49:22 +08:00
|
|
|
};
|
2017-09-25 16:32:28 +08:00
|
|
|
unsigned int counter_index;
|
|
|
|
bool counter_valid;
|
2016-07-05 17:27:50 +08:00
|
|
|
};
|
|
|
|
|
|
|
|
struct mlxsw_sp_nexthop_group {
|
2017-08-15 03:09:19 +08:00
|
|
|
void *priv;
|
2017-02-08 18:16:29 +08:00
|
|
|
struct rhash_head ht_node;
|
2016-07-05 17:27:50 +08:00
|
|
|
struct list_head fib_list; /* list of fib entries that use this group */
|
2017-07-18 16:10:19 +08:00
|
|
|
struct neigh_table *neigh_tbl;
|
2017-02-08 18:16:32 +08:00
|
|
|
u8 adj_index_valid:1,
|
|
|
|
gateway:1; /* routes using the group use a gateway */
|
2016-07-05 17:27:50 +08:00
|
|
|
u32 adj_index;
|
|
|
|
u16 ecmp_size;
|
|
|
|
u16 count;
|
2017-10-23 05:11:48 +08:00
|
|
|
int sum_norm_weight;
|
2016-07-05 17:27:50 +08:00
|
|
|
struct mlxsw_sp_nexthop nexthops[0];
|
2017-03-17 16:38:00 +08:00
|
|
|
#define nh_rif nexthops[0].rif
|
2016-07-05 17:27:50 +08:00
|
|
|
};
|
|
|
|
|
2017-09-25 16:32:30 +08:00
|
|
|
void mlxsw_sp_nexthop_counter_alloc(struct mlxsw_sp *mlxsw_sp,
|
|
|
|
struct mlxsw_sp_nexthop *nh)
|
2017-09-25 16:32:28 +08:00
|
|
|
{
|
|
|
|
struct devlink *devlink;
|
|
|
|
|
|
|
|
devlink = priv_to_devlink(mlxsw_sp->core);
|
|
|
|
if (!devlink_dpipe_table_counter_enabled(devlink,
|
|
|
|
MLXSW_SP_DPIPE_TABLE_NAME_ADJ))
|
|
|
|
return;
|
|
|
|
|
|
|
|
if (mlxsw_sp_flow_counter_alloc(mlxsw_sp, &nh->counter_index))
|
|
|
|
return;
|
|
|
|
|
|
|
|
nh->counter_valid = true;
|
|
|
|
}
|
|
|
|
|
2017-09-25 16:32:30 +08:00
|
|
|
void mlxsw_sp_nexthop_counter_free(struct mlxsw_sp *mlxsw_sp,
|
|
|
|
struct mlxsw_sp_nexthop *nh)
|
2017-09-25 16:32:28 +08:00
|
|
|
{
|
|
|
|
if (!nh->counter_valid)
|
|
|
|
return;
|
|
|
|
mlxsw_sp_flow_counter_free(mlxsw_sp, nh->counter_index);
|
|
|
|
nh->counter_valid = false;
|
|
|
|
}
|
|
|
|
|
|
|
|
/* Read the nexthop's flow counter into *p_counter.
 *
 * Returns -EINVAL when the nexthop has no valid counter, otherwise the
 * result of mlxsw_sp_flow_counter_get().
 */
int mlxsw_sp_nexthop_counter_get(struct mlxsw_sp *mlxsw_sp,
				 struct mlxsw_sp_nexthop *nh, u64 *p_counter)
{
	if (nh->counter_valid)
		return mlxsw_sp_flow_counter_get(mlxsw_sp, nh->counter_index,
						 p_counter, NULL);

	return -EINVAL;
}
|
|
|
|
|
2017-09-25 16:32:25 +08:00
|
|
|
struct mlxsw_sp_nexthop *mlxsw_sp_nexthop_next(struct mlxsw_sp_router *router,
|
|
|
|
struct mlxsw_sp_nexthop *nh)
|
|
|
|
{
|
|
|
|
if (!nh) {
|
|
|
|
if (list_empty(&router->nexthop_list))
|
|
|
|
return NULL;
|
|
|
|
else
|
|
|
|
return list_first_entry(&router->nexthop_list,
|
|
|
|
typeof(*nh), router_list_node);
|
|
|
|
}
|
|
|
|
if (list_is_last(&nh->router_list_node, &router->nexthop_list))
|
|
|
|
return NULL;
|
|
|
|
return list_next_entry(nh, router_list_node);
|
|
|
|
}
|
|
|
|
|
|
|
|
bool mlxsw_sp_nexthop_offload(struct mlxsw_sp_nexthop *nh)
|
|
|
|
{
|
|
|
|
return nh->offloaded;
|
|
|
|
}
|
|
|
|
|
|
|
|
unsigned char *mlxsw_sp_nexthop_ha(struct mlxsw_sp_nexthop *nh)
|
|
|
|
{
|
|
|
|
if (!nh->offloaded)
|
|
|
|
return NULL;
|
|
|
|
return nh->neigh_entry->ha;
|
|
|
|
}
|
|
|
|
|
|
|
|
/* Report where an offloaded nexthop lives in its group's adjacency range.
 *
 * @p_adj_index:      set to the group's adjacency index
 * @p_adj_size:       set to the group's ECMP size
 * @p_adj_hash_index: set to the sum of num_adj_entries of the offloaded
 *                    nexthops that precede 'nh' in the group
 *
 * Returns 0 on success, -EINVAL (leaving the outputs untouched) if the
 * nexthop is not offloaded or the group has no valid adjacency index.
 */
int mlxsw_sp_nexthop_indexes(struct mlxsw_sp_nexthop *nh, u32 *p_adj_index,
			     u32 *p_adj_size, u32 *p_adj_hash_index)
{
	struct mlxsw_sp_nexthop_group *nh_grp = nh->nh_grp;
	u32 hash_index = 0;
	int i;

	if (!nh->offloaded || !nh_grp->adj_index_valid)
		return -EINVAL;

	/* Walk the group up to, but not including, 'nh' itself. */
	for (i = 0; i < nh_grp->count && &nh_grp->nexthops[i] != nh; i++) {
		if (nh_grp->nexthops[i].offloaded)
			hash_index += nh_grp->nexthops[i].num_adj_entries;
	}

	*p_adj_index = nh_grp->adj_index;
	*p_adj_size = nh_grp->ecmp_size;
	*p_adj_hash_index = hash_index;

	return 0;
}
|
|
|
|
|
|
|
|
struct mlxsw_sp_rif *mlxsw_sp_nexthop_rif(struct mlxsw_sp_nexthop *nh)
|
|
|
|
{
|
|
|
|
return nh->rif;
|
|
|
|
}
|
|
|
|
|
|
|
|
bool mlxsw_sp_nexthop_group_has_ipip(struct mlxsw_sp_nexthop *nh)
|
|
|
|
{
|
|
|
|
struct mlxsw_sp_nexthop_group *nh_grp = nh->nh_grp;
|
|
|
|
int i;
|
|
|
|
|
|
|
|
for (i = 0; i < nh_grp->count; i++) {
|
|
|
|
struct mlxsw_sp_nexthop *nh_iter = &nh_grp->nexthops[i];
|
|
|
|
|
|
|
|
if (nh_iter->type == MLXSW_SP_NEXTHOP_TYPE_IPIP)
|
|
|
|
return true;
|
|
|
|
}
|
|
|
|
return false;
|
|
|
|
}
|
|
|
|
|
2017-08-15 03:09:19 +08:00
|
|
|
static struct fib_info *
|
|
|
|
mlxsw_sp_nexthop4_group_fi(const struct mlxsw_sp_nexthop_group *nh_grp)
|
|
|
|
{
|
|
|
|
return nh_grp->priv;
|
|
|
|
}
|
|
|
|
|
|
|
|
struct mlxsw_sp_nexthop_group_cmp_arg {
|
2017-08-15 03:09:20 +08:00
|
|
|
enum mlxsw_sp_l3proto proto;
|
|
|
|
union {
|
|
|
|
struct fib_info *fi;
|
|
|
|
struct mlxsw_sp_fib6_entry *fib6_entry;
|
|
|
|
};
|
2017-08-15 03:09:19 +08:00
|
|
|
};
|
|
|
|
|
2017-08-15 03:09:20 +08:00
|
|
|
static bool
|
|
|
|
mlxsw_sp_nexthop6_group_has_nexthop(const struct mlxsw_sp_nexthop_group *nh_grp,
|
2018-01-13 00:15:59 +08:00
|
|
|
const struct in6_addr *gw, int ifindex,
|
|
|
|
int weight)
|
2017-08-15 03:09:20 +08:00
|
|
|
{
|
|
|
|
int i;
|
|
|
|
|
|
|
|
for (i = 0; i < nh_grp->count; i++) {
|
|
|
|
const struct mlxsw_sp_nexthop *nh;
|
|
|
|
|
|
|
|
nh = &nh_grp->nexthops[i];
|
2018-01-13 00:15:59 +08:00
|
|
|
if (nh->ifindex == ifindex && nh->nh_weight == weight &&
|
2017-08-15 03:09:20 +08:00
|
|
|
ipv6_addr_equal(gw, (struct in6_addr *) nh->gw_addr))
|
|
|
|
return true;
|
|
|
|
}
|
|
|
|
|
|
|
|
return false;
|
|
|
|
}
|
|
|
|
|
|
|
|
static bool
|
|
|
|
mlxsw_sp_nexthop6_group_cmp(const struct mlxsw_sp_nexthop_group *nh_grp,
|
|
|
|
const struct mlxsw_sp_fib6_entry *fib6_entry)
|
|
|
|
{
|
|
|
|
struct mlxsw_sp_rt6 *mlxsw_sp_rt6;
|
|
|
|
|
|
|
|
if (nh_grp->count != fib6_entry->nrt6)
|
|
|
|
return false;
|
|
|
|
|
|
|
|
list_for_each_entry(mlxsw_sp_rt6, &fib6_entry->rt6_list, list) {
|
2019-05-23 11:27:59 +08:00
|
|
|
struct fib6_nh *fib6_nh = mlxsw_sp_rt6->rt->fib6_nh;
|
2017-08-15 03:09:20 +08:00
|
|
|
struct in6_addr *gw;
|
2018-01-13 00:15:59 +08:00
|
|
|
int ifindex, weight;
|
2017-08-15 03:09:20 +08:00
|
|
|
|
2019-03-28 11:53:56 +08:00
|
|
|
ifindex = fib6_nh->fib_nh_dev->ifindex;
|
|
|
|
weight = fib6_nh->fib_nh_weight;
|
|
|
|
gw = &fib6_nh->fib_nh_gw6;
|
2018-01-13 00:15:59 +08:00
|
|
|
if (!mlxsw_sp_nexthop6_group_has_nexthop(nh_grp, gw, ifindex,
|
|
|
|
weight))
|
2017-08-15 03:09:20 +08:00
|
|
|
return false;
|
|
|
|
}
|
|
|
|
|
|
|
|
return true;
|
|
|
|
}
|
|
|
|
|
2017-08-15 03:09:19 +08:00
|
|
|
static int
|
|
|
|
mlxsw_sp_nexthop_group_cmp(struct rhashtable_compare_arg *arg, const void *ptr)
|
|
|
|
{
|
|
|
|
const struct mlxsw_sp_nexthop_group_cmp_arg *cmp_arg = arg->key;
|
|
|
|
const struct mlxsw_sp_nexthop_group *nh_grp = ptr;
|
|
|
|
|
2017-08-15 03:09:20 +08:00
|
|
|
switch (cmp_arg->proto) {
|
|
|
|
case MLXSW_SP_L3_PROTO_IPV4:
|
|
|
|
return cmp_arg->fi != mlxsw_sp_nexthop4_group_fi(nh_grp);
|
|
|
|
case MLXSW_SP_L3_PROTO_IPV6:
|
|
|
|
return !mlxsw_sp_nexthop6_group_cmp(nh_grp,
|
|
|
|
cmp_arg->fib6_entry);
|
|
|
|
default:
|
|
|
|
WARN_ON(1);
|
|
|
|
return 1;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
static int
|
|
|
|
mlxsw_sp_nexthop_group_type(const struct mlxsw_sp_nexthop_group *nh_grp)
|
|
|
|
{
|
|
|
|
return nh_grp->neigh_tbl->family;
|
2017-08-15 03:09:19 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
/* rhashtable object hash callback for nexthop groups.
 *
 * IPv4 groups hash the fib_info pointer. IPv6 groups hash the nexthop count
 * XORed with the hash of every nexthop's ifindex; because XOR is commutative
 * the result does not depend on the order of the nexthops. 'len' is unused.
 */
static u32 mlxsw_sp_nexthop_group_hash_obj(const void *data, u32 len, u32 seed)
{
	const struct mlxsw_sp_nexthop_group *nh_grp = data;
	int family = mlxsw_sp_nexthop_group_type(nh_grp);
	struct fib_info *fi;
	unsigned int val;
	int i;

	if (family == AF_INET) {
		fi = mlxsw_sp_nexthop4_group_fi(nh_grp);
		return jhash(&fi, sizeof(fi), seed);
	}

	if (family == AF_INET6) {
		val = nh_grp->count;
		for (i = 0; i < nh_grp->count; i++) {
			const struct mlxsw_sp_nexthop *nh;

			nh = &nh_grp->nexthops[i];
			val ^= jhash(&nh->ifindex, sizeof(nh->ifindex), seed);
		}
		return jhash(&val, sizeof(val), seed);
	}

	/* Unknown family: warn and fall back to a constant hash. */
	WARN_ON(1);
	return 0;
}
|
|
|
|
|
|
|
|
static u32
|
|
|
|
mlxsw_sp_nexthop6_group_hash(struct mlxsw_sp_fib6_entry *fib6_entry, u32 seed)
|
|
|
|
{
|
|
|
|
unsigned int val = fib6_entry->nrt6;
|
|
|
|
struct mlxsw_sp_rt6 *mlxsw_sp_rt6;
|
|
|
|
struct net_device *dev;
|
|
|
|
|
|
|
|
list_for_each_entry(mlxsw_sp_rt6, &fib6_entry->rt6_list, list) {
|
2019-05-23 11:27:59 +08:00
|
|
|
dev = mlxsw_sp_rt6->rt->fib6_nh->fib_nh_dev;
|
2019-07-23 15:57:42 +08:00
|
|
|
val ^= jhash(&dev->ifindex, sizeof(dev->ifindex), seed);
|
2017-08-15 03:09:20 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
return jhash(&val, sizeof(val), seed);
|
2017-08-15 03:09:19 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
static u32
|
|
|
|
mlxsw_sp_nexthop_group_hash(const void *data, u32 len, u32 seed)
|
|
|
|
{
|
|
|
|
const struct mlxsw_sp_nexthop_group_cmp_arg *cmp_arg = data;
|
|
|
|
|
2017-08-15 03:09:20 +08:00
|
|
|
switch (cmp_arg->proto) {
|
|
|
|
case MLXSW_SP_L3_PROTO_IPV4:
|
|
|
|
return jhash(&cmp_arg->fi, sizeof(cmp_arg->fi), seed);
|
|
|
|
case MLXSW_SP_L3_PROTO_IPV6:
|
|
|
|
return mlxsw_sp_nexthop6_group_hash(cmp_arg->fib6_entry, seed);
|
|
|
|
default:
|
|
|
|
WARN_ON(1);
|
|
|
|
return 0;
|
|
|
|
}
|
2017-08-15 03:09:19 +08:00
|
|
|
}
|
|
|
|
|
2017-02-08 18:16:29 +08:00
|
|
|
static const struct rhashtable_params mlxsw_sp_nexthop_group_ht_params = {
|
|
|
|
.head_offset = offsetof(struct mlxsw_sp_nexthop_group, ht_node),
|
2017-08-15 03:09:19 +08:00
|
|
|
.hashfn = mlxsw_sp_nexthop_group_hash,
|
|
|
|
.obj_hashfn = mlxsw_sp_nexthop_group_hash_obj,
|
|
|
|
.obj_cmpfn = mlxsw_sp_nexthop_group_cmp,
|
2017-02-08 18:16:29 +08:00
|
|
|
};
|
|
|
|
|
|
|
|
static int mlxsw_sp_nexthop_group_insert(struct mlxsw_sp *mlxsw_sp,
|
|
|
|
struct mlxsw_sp_nexthop_group *nh_grp)
|
|
|
|
{
|
2017-08-15 03:09:20 +08:00
|
|
|
if (mlxsw_sp_nexthop_group_type(nh_grp) == AF_INET6 &&
|
|
|
|
!nh_grp->gateway)
|
|
|
|
return 0;
|
|
|
|
|
2017-05-17 01:38:25 +08:00
|
|
|
return rhashtable_insert_fast(&mlxsw_sp->router->nexthop_group_ht,
|
2017-02-08 18:16:29 +08:00
|
|
|
&nh_grp->ht_node,
|
|
|
|
mlxsw_sp_nexthop_group_ht_params);
|
|
|
|
}
|
|
|
|
|
|
|
|
static void mlxsw_sp_nexthop_group_remove(struct mlxsw_sp *mlxsw_sp,
|
|
|
|
struct mlxsw_sp_nexthop_group *nh_grp)
|
|
|
|
{
|
2017-08-15 03:09:20 +08:00
|
|
|
if (mlxsw_sp_nexthop_group_type(nh_grp) == AF_INET6 &&
|
|
|
|
!nh_grp->gateway)
|
|
|
|
return;
|
|
|
|
|
2017-05-17 01:38:25 +08:00
|
|
|
rhashtable_remove_fast(&mlxsw_sp->router->nexthop_group_ht,
|
2017-02-08 18:16:29 +08:00
|
|
|
&nh_grp->ht_node,
|
|
|
|
mlxsw_sp_nexthop_group_ht_params);
|
|
|
|
}
|
|
|
|
|
|
|
|
static struct mlxsw_sp_nexthop_group *
|
2017-08-15 03:09:19 +08:00
|
|
|
mlxsw_sp_nexthop4_group_lookup(struct mlxsw_sp *mlxsw_sp,
|
|
|
|
struct fib_info *fi)
|
2017-02-08 18:16:29 +08:00
|
|
|
{
|
2017-08-15 03:09:19 +08:00
|
|
|
struct mlxsw_sp_nexthop_group_cmp_arg cmp_arg;
|
|
|
|
|
2017-08-15 03:09:20 +08:00
|
|
|
cmp_arg.proto = MLXSW_SP_L3_PROTO_IPV4;
|
2017-08-15 03:09:19 +08:00
|
|
|
cmp_arg.fi = fi;
|
|
|
|
return rhashtable_lookup_fast(&mlxsw_sp->router->nexthop_group_ht,
|
|
|
|
&cmp_arg,
|
2017-02-08 18:16:29 +08:00
|
|
|
mlxsw_sp_nexthop_group_ht_params);
|
|
|
|
}
|
|
|
|
|
2017-08-15 03:09:20 +08:00
|
|
|
static struct mlxsw_sp_nexthop_group *
|
|
|
|
mlxsw_sp_nexthop6_group_lookup(struct mlxsw_sp *mlxsw_sp,
|
|
|
|
struct mlxsw_sp_fib6_entry *fib6_entry)
|
|
|
|
{
|
|
|
|
struct mlxsw_sp_nexthop_group_cmp_arg cmp_arg;
|
|
|
|
|
|
|
|
cmp_arg.proto = MLXSW_SP_L3_PROTO_IPV6;
|
|
|
|
cmp_arg.fib6_entry = fib6_entry;
|
|
|
|
return rhashtable_lookup_fast(&mlxsw_sp->router->nexthop_group_ht,
|
|
|
|
&cmp_arg,
|
|
|
|
mlxsw_sp_nexthop_group_ht_params);
|
|
|
|
}
|
|
|
|
|
2017-02-08 18:16:30 +08:00
|
|
|
static const struct rhashtable_params mlxsw_sp_nexthop_ht_params = {
|
|
|
|
.key_offset = offsetof(struct mlxsw_sp_nexthop, key),
|
|
|
|
.head_offset = offsetof(struct mlxsw_sp_nexthop, ht_node),
|
|
|
|
.key_len = sizeof(struct mlxsw_sp_nexthop_key),
|
|
|
|
};
|
|
|
|
|
|
|
|
static int mlxsw_sp_nexthop_insert(struct mlxsw_sp *mlxsw_sp,
|
|
|
|
struct mlxsw_sp_nexthop *nh)
|
|
|
|
{
|
2017-05-17 01:38:25 +08:00
|
|
|
return rhashtable_insert_fast(&mlxsw_sp->router->nexthop_ht,
|
2017-02-08 18:16:30 +08:00
|
|
|
&nh->ht_node, mlxsw_sp_nexthop_ht_params);
|
|
|
|
}
|
|
|
|
|
|
|
|
static void mlxsw_sp_nexthop_remove(struct mlxsw_sp *mlxsw_sp,
|
|
|
|
struct mlxsw_sp_nexthop *nh)
|
|
|
|
{
|
2017-05-17 01:38:25 +08:00
|
|
|
rhashtable_remove_fast(&mlxsw_sp->router->nexthop_ht, &nh->ht_node,
|
2017-02-08 18:16:30 +08:00
|
|
|
mlxsw_sp_nexthop_ht_params);
|
|
|
|
}
|
|
|
|
|
mlxsw: spectrum_router: Reflect nexthop status changes
When a packet hits a multipath route in the device's routing table, a
hash is computed over its headers, which is then used to select the
appropriate nexthop from the device's adjacency table.
There are situations in which the kernel removes a nexthop from a
multipath route (e.g., no carrier) and the device should do the same.
Upon the reception of NH_{ADD,DEL} events, add or remove a nexthop from
the device's adjacency table and refresh all the routes using the
nexthop group. If all the nexthops of a multipath route are invalid,
then any packet hitting the route would be trapped to the CPU for
forwarding.
If all the nexthops are DEAD, then the kernel would remove the route
entirely. On the other hand, if all the nexthops are merely LINKDOWN,
then the kernel would keep the route and forward any incoming packet
using a different route.
While the last case might sound like a problem, it's expected that a
routing daemon running in user space would remove such a route from the
FIB as it's dumped with the DEAD flag set.
Signed-off-by: Ido Schimmel <idosch@mellanox.com>
Signed-off-by: Jiri Pirko <jiri@mellanox.com>
Signed-off-by: David S. Miller <davem@davemloft.net>
2017-02-08 18:16:40 +08:00
|
|
|
static struct mlxsw_sp_nexthop *
|
|
|
|
mlxsw_sp_nexthop_lookup(struct mlxsw_sp *mlxsw_sp,
|
|
|
|
struct mlxsw_sp_nexthop_key key)
|
|
|
|
{
|
2017-05-17 01:38:25 +08:00
|
|
|
return rhashtable_lookup_fast(&mlxsw_sp->router->nexthop_ht, &key,
|
mlxsw: spectrum_router: Reflect nexthop status changes
When a packet hits a multipath route in the device's routing table, a
hash is computed over its headers, which is then used to select the
appropriate nexthop from the device's adjacency table.
There are situations in which the kernel removes a nexthop from a
multipath route (e.g., no carrier) and the device should do the same.
Upon the reception of NH_{ADD,DEL} events, add or remove a nexthop from
the device's adjacency table and refresh all the routes using the
nexthop group. If all the nexthops of a multipath route are invalid,
then any packet hitting the route would be trapped to the CPU for
forwarding.
If all the nexthops are DEAD, then the kernel would remove the route
entirely. On the other hand, if all the nexthops are merely LINKDOWN,
then the kernel would keep the route and forward any incoming packet
using a different route.
While the last case might sound like a problem, it's expected that a
routing daemon running in user space would remove such a route from the
FIB as it's dumped with the DEAD flag set.
Signed-off-by: Ido Schimmel <idosch@mellanox.com>
Signed-off-by: Jiri Pirko <jiri@mellanox.com>
Signed-off-by: David S. Miller <davem@davemloft.net>
2017-02-08 18:16:40 +08:00
|
|
|
mlxsw_sp_nexthop_ht_params);
|
|
|
|
}
|
|
|
|
|
2016-07-05 17:27:50 +08:00
|
|
|
static int mlxsw_sp_adj_index_mass_update_vr(struct mlxsw_sp *mlxsw_sp,
|
2017-03-10 15:53:41 +08:00
|
|
|
const struct mlxsw_sp_fib *fib,
|
2016-07-05 17:27:50 +08:00
|
|
|
u32 adj_index, u16 ecmp_size,
|
|
|
|
u32 new_adj_index,
|
|
|
|
u16 new_ecmp_size)
|
|
|
|
{
|
|
|
|
char raleu_pl[MLXSW_REG_RALEU_LEN];
|
|
|
|
|
2016-09-19 14:29:26 +08:00
|
|
|
mlxsw_reg_raleu_pack(raleu_pl,
|
2017-03-10 15:53:41 +08:00
|
|
|
(enum mlxsw_reg_ralxx_protocol) fib->proto,
|
|
|
|
fib->vr->id, adj_index, ecmp_size, new_adj_index,
|
2016-09-19 14:29:26 +08:00
|
|
|
new_ecmp_size);
|
2016-07-05 17:27:50 +08:00
|
|
|
return mlxsw_reg_write(mlxsw_sp->core, MLXSW_REG(raleu), raleu_pl);
|
|
|
|
}
|
|
|
|
|
|
|
|
static int mlxsw_sp_adj_index_mass_update(struct mlxsw_sp *mlxsw_sp,
|
|
|
|
struct mlxsw_sp_nexthop_group *nh_grp,
|
|
|
|
u32 old_adj_index, u16 old_ecmp_size)
|
|
|
|
{
|
|
|
|
struct mlxsw_sp_fib_entry *fib_entry;
|
2017-03-10 15:53:41 +08:00
|
|
|
struct mlxsw_sp_fib *fib = NULL;
|
2016-07-05 17:27:50 +08:00
|
|
|
int err;
|
|
|
|
|
|
|
|
list_for_each_entry(fib_entry, &nh_grp->fib_list, nexthop_group_node) {
|
2017-03-10 15:53:41 +08:00
|
|
|
if (fib == fib_entry->fib_node->fib)
|
2016-07-05 17:27:50 +08:00
|
|
|
continue;
|
2017-03-10 15:53:41 +08:00
|
|
|
fib = fib_entry->fib_node->fib;
|
|
|
|
err = mlxsw_sp_adj_index_mass_update_vr(mlxsw_sp, fib,
|
2016-07-05 17:27:50 +08:00
|
|
|
old_adj_index,
|
|
|
|
old_ecmp_size,
|
|
|
|
nh_grp->adj_index,
|
|
|
|
nh_grp->ecmp_size);
|
|
|
|
if (err)
|
|
|
|
return err;
|
|
|
|
}
|
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
2017-10-23 05:11:48 +08:00
|
|
|
/* Write a single Ethernet adjacency entry at 'adj_index' for nexthop 'nh'.
 *
 * The entry is built from the RIF and hardware address of the nexthop's
 * neighbour entry. A counter is bound to the entry only when the nexthop
 * has a valid one.
 *
 * Returns the result of mlxsw_reg_write().
 */
static int __mlxsw_sp_nexthop_update(struct mlxsw_sp *mlxsw_sp, u32 adj_index,
				     struct mlxsw_sp_nexthop *nh)
{
	struct mlxsw_sp_neigh_entry *neigh = nh->neigh_entry;
	char ratr_pl[MLXSW_REG_RATR_LEN];

	mlxsw_reg_ratr_pack(ratr_pl, MLXSW_REG_RATR_OP_WRITE_WRITE_ENTRY,
			    true, MLXSW_REG_RATR_TYPE_ETHERNET,
			    adj_index, neigh->rif);
	mlxsw_reg_ratr_eth_entry_pack(ratr_pl, neigh->ha);

	if (!nh->counter_valid)
		mlxsw_reg_ratr_counter_pack(ratr_pl, 0, false);
	else
		mlxsw_reg_ratr_counter_pack(ratr_pl, nh->counter_index, true);

	return mlxsw_reg_write(mlxsw_sp->core, MLXSW_REG(ratr), ratr_pl);
}
|
|
|
|
|
2017-10-23 05:11:48 +08:00
|
|
|
/* Program every adjacency entry owned by Ethernet nexthop 'nh', i.e. the
 * nh->num_adj_entries consecutive indexes starting at 'adj_index'.
 *
 * Stops at, and returns, the first error; returns 0 if all writes succeed.
 */
int mlxsw_sp_nexthop_update(struct mlxsw_sp *mlxsw_sp, u32 adj_index,
			    struct mlxsw_sp_nexthop *nh)
{
	int err = 0;
	int offset;

	for (offset = 0; !err && offset < nh->num_adj_entries; offset++)
		err = __mlxsw_sp_nexthop_update(mlxsw_sp, adj_index + offset,
						nh);

	return err;
}
|
|
|
|
|
|
|
|
static int __mlxsw_sp_nexthop_ipip_update(struct mlxsw_sp *mlxsw_sp,
|
|
|
|
u32 adj_index,
|
|
|
|
struct mlxsw_sp_nexthop *nh)
|
2017-09-03 05:49:23 +08:00
|
|
|
{
|
|
|
|
const struct mlxsw_sp_ipip_ops *ipip_ops;
|
|
|
|
|
|
|
|
ipip_ops = mlxsw_sp->router->ipip_ops_arr[nh->ipip_entry->ipipt];
|
|
|
|
return ipip_ops->nexthop_update(mlxsw_sp, adj_index, nh->ipip_entry);
|
|
|
|
}
|
|
|
|
|
2017-10-23 05:11:48 +08:00
|
|
|
static int mlxsw_sp_nexthop_ipip_update(struct mlxsw_sp *mlxsw_sp,
|
|
|
|
u32 adj_index,
|
|
|
|
struct mlxsw_sp_nexthop *nh)
|
|
|
|
{
|
|
|
|
int i;
|
|
|
|
|
|
|
|
for (i = 0; i < nh->num_adj_entries; i++) {
|
|
|
|
int err;
|
|
|
|
|
|
|
|
err = __mlxsw_sp_nexthop_ipip_update(mlxsw_sp, adj_index + i,
|
|
|
|
nh);
|
|
|
|
if (err)
|
|
|
|
return err;
|
|
|
|
}
|
|
|
|
|
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
2016-07-05 17:27:50 +08:00
|
|
|
static int
|
mlxsw: spectrum_router: Make nexthops typed
In the router, some next hops may reference an encapsulating netdevice,
such as GRE or IPIP. To properly offload these next hops, mlxsw needs to
keep track of whether a given next hop is a regular Ethernet entry, or
an IP-in-IP tunneling entry.
To facilitate this book-keeping, add a type field to struct
mlxsw_sp_nexthop. There is, as of this patch, only one next hop type:
MLXSW_SP_NEXTHOP_TYPE_ETH. Follow-up patches will introduce the IP-in-IP
variant.
There are several places where next hops are initialized in the IPv4
path. Instead of replicating the logic at every one of them, factor it
out to a function mlxsw_sp_nexthop4_type_init(). The corresponding fini
is actually protocol-neutral, so put it to mlxsw_sp_nexthop_type_fini(),
but create a corresponding protocoled _fini function that dispatches to
the protocol-neutral one.
The IPv6 path is simpler, but for symmetry with IPv4, create the same
suite of functions with corresponding logic.
Signed-off-by: Petr Machata <petrm@mellanox.com>
Reviewed-by: Ido Schimmel <idosch@mellanox.com>
Signed-off-by: Jiri Pirko <jiri@mellanox.com>
Signed-off-by: David S. Miller <davem@davemloft.net>
2017-09-03 05:49:22 +08:00
|
|
|
mlxsw_sp_nexthop_group_update(struct mlxsw_sp *mlxsw_sp,
|
|
|
|
struct mlxsw_sp_nexthop_group *nh_grp,
|
|
|
|
bool reallocate)
|
2016-07-05 17:27:50 +08:00
|
|
|
{
|
|
|
|
u32 adj_index = nh_grp->adj_index; /* base */
|
|
|
|
struct mlxsw_sp_nexthop *nh;
|
|
|
|
int i;
|
|
|
|
int err;
|
|
|
|
|
|
|
|
for (i = 0; i < nh_grp->count; i++) {
|
|
|
|
nh = &nh_grp->nexthops[i];
|
|
|
|
|
|
|
|
if (!nh->should_offload) {
|
|
|
|
nh->offloaded = 0;
|
|
|
|
continue;
|
|
|
|
}
|
|
|
|
|
2017-01-23 18:11:42 +08:00
|
|
|
if (nh->update || reallocate) {
|
mlxsw: spectrum_router: Make nexthops typed
In the router, some next hops may reference an encapsulating netdevice,
such as GRE or IPIP. To properly offload these next hops, mlxsw needs to
keep track of whether a given next hop is a regular Ethernet entry, or
an IP-in-IP tunneling entry.
To facilitate this book-keeping, add a type field to struct
mlxsw_sp_nexthop. There is, as of this patch, only one next hop type:
MLXSW_SP_NEXTHOP_TYPE_ETH. Follow-up patches will introduce the IP-in-IP
variant.
There are several places where next hops are initialized in the IPv4
path. Instead of replicating the logic at every one of them, factor it
out to a function mlxsw_sp_nexthop4_type_init(). The corresponding fini
is actually protocol-neutral, so put it to mlxsw_sp_nexthop_type_fini(),
but create a corresponding protocoled _fini function that dispatches to
the protocol-neutral one.
The IPv6 path is simpler, but for symmetry with IPv4, create the same
suite of functions with corresponding logic.
Signed-off-by: Petr Machata <petrm@mellanox.com>
Reviewed-by: Ido Schimmel <idosch@mellanox.com>
Signed-off-by: Jiri Pirko <jiri@mellanox.com>
Signed-off-by: David S. Miller <davem@davemloft.net>
2017-09-03 05:49:22 +08:00
|
|
|
switch (nh->type) {
|
|
|
|
case MLXSW_SP_NEXTHOP_TYPE_ETH:
|
2017-09-25 16:32:28 +08:00
|
|
|
err = mlxsw_sp_nexthop_update
|
mlxsw: spectrum_router: Make nexthops typed
In the router, some next hops may reference an encapsulating netdevice,
such as GRE or IPIP. To properly offload these next hops, mlxsw needs to
keep track of whether a given next hop is a regular Ethernet entry, or
an IP-in-IP tunneling entry.
To facilitate this book-keeping, add a type field to struct
mlxsw_sp_nexthop. There is, as of this patch, only one next hop type:
MLXSW_SP_NEXTHOP_TYPE_ETH. Follow-up patches will introduce the IP-in-IP
variant.
There are several places where next hops are initialized in the IPv4
path. Instead of replicating the logic at every one of them, factor it
out to a function mlxsw_sp_nexthop4_type_init(). The corresponding fini
is actually protocol-neutral, so put it to mlxsw_sp_nexthop_type_fini(),
but create a corresponding protocoled _fini function that dispatches to
the protocol-neutral one.
The IPv6 path is simpler, but for symmetry with IPv4, create the same
suite of functions with corresponding logic.
Signed-off-by: Petr Machata <petrm@mellanox.com>
Reviewed-by: Ido Schimmel <idosch@mellanox.com>
Signed-off-by: Jiri Pirko <jiri@mellanox.com>
Signed-off-by: David S. Miller <davem@davemloft.net>
2017-09-03 05:49:22 +08:00
|
|
|
(mlxsw_sp, adj_index, nh);
|
|
|
|
break;
|
2017-09-03 05:49:23 +08:00
|
|
|
case MLXSW_SP_NEXTHOP_TYPE_IPIP:
|
|
|
|
err = mlxsw_sp_nexthop_ipip_update
|
|
|
|
(mlxsw_sp, adj_index, nh);
|
|
|
|
break;
|
mlxsw: spectrum_router: Make nexthops typed
In the router, some next hops may reference an encapsulating netdevice,
such as GRE or IPIP. To properly offload these next hops, mlxsw needs to
keep track of whether a given next hop is a regular Ethernet entry, or
an IP-in-IP tunneling entry.
To facilitate this book-keeping, add a type field to struct
mlxsw_sp_nexthop. There is, as of this patch, only one next hop type:
MLXSW_SP_NEXTHOP_TYPE_ETH. Follow-up patches will introduce the IP-in-IP
variant.
There are several places where next hops are initialized in the IPv4
path. Instead of replicating the logic at every one of them, factor it
out to a function mlxsw_sp_nexthop4_type_init(). The corresponding fini
is actually protocol-neutral, so put it to mlxsw_sp_nexthop_type_fini(),
but create a corresponding protocoled _fini function that dispatches to
the protocol-neutral one.
The IPv6 path is simpler, but for symmetry with IPv4, create the same
suite of functions with corresponding logic.
Signed-off-by: Petr Machata <petrm@mellanox.com>
Reviewed-by: Ido Schimmel <idosch@mellanox.com>
Signed-off-by: Jiri Pirko <jiri@mellanox.com>
Signed-off-by: David S. Miller <davem@davemloft.net>
2017-09-03 05:49:22 +08:00
|
|
|
}
|
2016-07-05 17:27:50 +08:00
|
|
|
if (err)
|
|
|
|
return err;
|
|
|
|
nh->update = 0;
|
|
|
|
nh->offloaded = 1;
|
|
|
|
}
|
2017-10-23 05:11:48 +08:00
|
|
|
adj_index += nh->num_adj_entries;
|
2016-07-05 17:27:50 +08:00
|
|
|
}
|
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
|
|
|
static int
|
|
|
|
mlxsw_sp_nexthop_fib_entries_update(struct mlxsw_sp *mlxsw_sp,
|
|
|
|
struct mlxsw_sp_nexthop_group *nh_grp)
|
|
|
|
{
|
|
|
|
struct mlxsw_sp_fib_entry *fib_entry;
|
|
|
|
int err;
|
|
|
|
|
|
|
|
list_for_each_entry(fib_entry, &nh_grp->fib_list, nexthop_group_node) {
|
|
|
|
err = mlxsw_sp_fib_entry_update(mlxsw_sp, fib_entry);
|
|
|
|
if (err)
|
|
|
|
return err;
|
|
|
|
}
|
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
2017-10-23 05:11:47 +08:00
|
|
|
/* Round *p_adj_grp_size up to the nearest valid adjacency group size.
 *
 * Valid sizes for an adjacency group are:
 * 1-64, 512, 1024, 2048 and 4096.
 * Anything above 2048 is set to 4096.
 */
static void mlxsw_sp_adj_grp_size_round_up(u16 *p_adj_grp_size)
{
	u16 size = *p_adj_grp_size;

	/* Sizes up to 64 are used as they are. */
	if (size <= 64)
		return;

	if (size <= 512)
		size = 512;
	else if (size <= 1024)
		size = 1024;
	else if (size <= 2048)
		size = 2048;
	else
		size = 4096;

	*p_adj_grp_size = size;
}
|
|
|
|
|
|
|
|
/* Set *p_adj_grp_size to the largest of 512, 1024, 2048 and 4096 that does
 * not exceed 'alloc_size'. When 'alloc_size' is below 512 the group size is
 * left as it was.
 */
static void mlxsw_sp_adj_grp_size_round_down(u16 *p_adj_grp_size,
					     unsigned int alloc_size)
{
	if (alloc_size < 512)
		return;

	if (alloc_size < 1024)
		*p_adj_grp_size = 512;
	else if (alloc_size < 2048)
		*p_adj_grp_size = 1024;
	else if (alloc_size < 4096)
		*p_adj_grp_size = 2048;
	else
		*p_adj_grp_size = 4096;
}
|
|
|
|
|
|
|
|
static int mlxsw_sp_fix_adj_grp_size(struct mlxsw_sp *mlxsw_sp,
|
|
|
|
u16 *p_adj_grp_size)
|
|
|
|
{
|
|
|
|
unsigned int alloc_size;
|
|
|
|
int err;
|
|
|
|
|
|
|
|
/* Round up the requested group size to the next size supported
|
|
|
|
* by the device and make sure the request can be satisfied.
|
|
|
|
*/
|
|
|
|
mlxsw_sp_adj_grp_size_round_up(p_adj_grp_size);
|
2018-07-09 04:51:17 +08:00
|
|
|
err = mlxsw_sp_kvdl_alloc_count_query(mlxsw_sp,
|
|
|
|
MLXSW_SP_KVDL_ENTRY_TYPE_ADJ,
|
|
|
|
*p_adj_grp_size, &alloc_size);
|
2017-10-23 05:11:47 +08:00
|
|
|
if (err)
|
|
|
|
return err;
|
|
|
|
/* It is possible the allocation results in more allocated
|
|
|
|
* entries than requested. Try to use as much of them as
|
|
|
|
* possible.
|
|
|
|
*/
|
|
|
|
mlxsw_sp_adj_grp_size_round_down(p_adj_grp_size, alloc_size);
|
|
|
|
|
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
2017-10-23 05:11:48 +08:00
|
|
|
static void
|
|
|
|
mlxsw_sp_nexthop_group_normalize(struct mlxsw_sp_nexthop_group *nh_grp)
|
|
|
|
{
|
|
|
|
int i, g = 0, sum_norm_weight = 0;
|
|
|
|
struct mlxsw_sp_nexthop *nh;
|
|
|
|
|
|
|
|
for (i = 0; i < nh_grp->count; i++) {
|
|
|
|
nh = &nh_grp->nexthops[i];
|
|
|
|
|
|
|
|
if (!nh->should_offload)
|
|
|
|
continue;
|
|
|
|
if (g > 0)
|
|
|
|
g = gcd(nh->nh_weight, g);
|
|
|
|
else
|
|
|
|
g = nh->nh_weight;
|
|
|
|
}
|
|
|
|
|
|
|
|
for (i = 0; i < nh_grp->count; i++) {
|
|
|
|
nh = &nh_grp->nexthops[i];
|
|
|
|
|
|
|
|
if (!nh->should_offload)
|
|
|
|
continue;
|
|
|
|
nh->norm_nh_weight = nh->nh_weight / g;
|
|
|
|
sum_norm_weight += nh->norm_nh_weight;
|
|
|
|
}
|
|
|
|
|
|
|
|
nh_grp->sum_norm_weight = sum_norm_weight;
|
|
|
|
}
|
|
|
|
|
|
|
|
static void
|
|
|
|
mlxsw_sp_nexthop_group_rebalance(struct mlxsw_sp_nexthop_group *nh_grp)
|
|
|
|
{
|
|
|
|
int total = nh_grp->sum_norm_weight;
|
|
|
|
u16 ecmp_size = nh_grp->ecmp_size;
|
|
|
|
int i, weight = 0, lower_bound = 0;
|
|
|
|
|
|
|
|
for (i = 0; i < nh_grp->count; i++) {
|
|
|
|
struct mlxsw_sp_nexthop *nh = &nh_grp->nexthops[i];
|
|
|
|
int upper_bound;
|
|
|
|
|
|
|
|
if (!nh->should_offload)
|
|
|
|
continue;
|
|
|
|
weight += nh->norm_nh_weight;
|
|
|
|
upper_bound = DIV_ROUND_CLOSEST(ecmp_size * weight, total);
|
|
|
|
nh->num_adj_entries = upper_bound - lower_bound;
|
|
|
|
lower_bound = upper_bound;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2020-01-14 19:23:13 +08:00
|
|
|
/* Forward declaration: mlxsw_sp_rt6_nexthop() is called by
 * __mlxsw_sp_nexthop6_group_offload_refresh() below, ahead of its definition.
 */
static struct mlxsw_sp_nexthop *
|
|
|
|
mlxsw_sp_rt6_nexthop(struct mlxsw_sp_nexthop_group *nh_grp,
|
|
|
|
const struct mlxsw_sp_rt6 *mlxsw_sp_rt6);
|
|
|
|
|
|
|
|
static void
|
|
|
|
mlxsw_sp_nexthop4_group_offload_refresh(struct mlxsw_sp *mlxsw_sp,
|
|
|
|
struct mlxsw_sp_nexthop_group *nh_grp)
|
|
|
|
{
|
|
|
|
int i;
|
|
|
|
|
|
|
|
for (i = 0; i < nh_grp->count; i++) {
|
|
|
|
struct mlxsw_sp_nexthop *nh = &nh_grp->nexthops[i];
|
|
|
|
|
|
|
|
if (nh->offloaded)
|
|
|
|
nh->key.fib_nh->fib_nh_flags |= RTNH_F_OFFLOAD;
|
|
|
|
else
|
|
|
|
nh->key.fib_nh->fib_nh_flags &= ~RTNH_F_OFFLOAD;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
static void
|
|
|
|
__mlxsw_sp_nexthop6_group_offload_refresh(struct mlxsw_sp_nexthop_group *nh_grp,
|
|
|
|
struct mlxsw_sp_fib6_entry *fib6_entry)
|
|
|
|
{
|
|
|
|
struct mlxsw_sp_rt6 *mlxsw_sp_rt6;
|
|
|
|
|
|
|
|
list_for_each_entry(mlxsw_sp_rt6, &fib6_entry->rt6_list, list) {
|
|
|
|
struct fib6_nh *fib6_nh = mlxsw_sp_rt6->rt->fib6_nh;
|
|
|
|
struct mlxsw_sp_nexthop *nh;
|
|
|
|
|
|
|
|
nh = mlxsw_sp_rt6_nexthop(nh_grp, mlxsw_sp_rt6);
|
|
|
|
if (nh && nh->offloaded)
|
|
|
|
fib6_nh->fib_nh_flags |= RTNH_F_OFFLOAD;
|
|
|
|
else
|
|
|
|
fib6_nh->fib_nh_flags &= ~RTNH_F_OFFLOAD;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
static void
|
|
|
|
mlxsw_sp_nexthop6_group_offload_refresh(struct mlxsw_sp *mlxsw_sp,
|
|
|
|
struct mlxsw_sp_nexthop_group *nh_grp)
|
|
|
|
{
|
|
|
|
struct mlxsw_sp_fib6_entry *fib6_entry;
|
|
|
|
|
|
|
|
/* Unfortunately, in IPv6 the route and the nexthop are described by
|
|
|
|
* the same struct, so we need to iterate over all the routes using the
|
|
|
|
* nexthop group and set / clear the offload indication for them.
|
|
|
|
*/
|
|
|
|
list_for_each_entry(fib6_entry, &nh_grp->fib_list,
|
|
|
|
common.nexthop_group_node)
|
|
|
|
__mlxsw_sp_nexthop6_group_offload_refresh(nh_grp, fib6_entry);
|
|
|
|
}
|
|
|
|
|
|
|
|
static void
|
|
|
|
mlxsw_sp_nexthop_group_offload_refresh(struct mlxsw_sp *mlxsw_sp,
|
|
|
|
struct mlxsw_sp_nexthop_group *nh_grp)
|
|
|
|
{
|
|
|
|
switch (mlxsw_sp_nexthop_group_type(nh_grp)) {
|
|
|
|
case AF_INET:
|
|
|
|
mlxsw_sp_nexthop4_group_offload_refresh(mlxsw_sp, nh_grp);
|
|
|
|
break;
|
|
|
|
case AF_INET6:
|
|
|
|
mlxsw_sp_nexthop6_group_offload_refresh(mlxsw_sp, nh_grp);
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2016-07-05 17:27:50 +08:00
|
|
|
static void
|
|
|
|
mlxsw_sp_nexthop_group_refresh(struct mlxsw_sp *mlxsw_sp,
|
|
|
|
struct mlxsw_sp_nexthop_group *nh_grp)
|
|
|
|
{
|
2017-10-23 05:11:48 +08:00
|
|
|
u16 ecmp_size, old_ecmp_size;
|
2016-07-05 17:27:50 +08:00
|
|
|
struct mlxsw_sp_nexthop *nh;
|
|
|
|
bool offload_change = false;
|
|
|
|
u32 adj_index;
|
|
|
|
bool old_adj_index_valid;
|
|
|
|
u32 old_adj_index;
|
|
|
|
int i;
|
|
|
|
int err;
|
|
|
|
|
2017-02-08 18:16:32 +08:00
|
|
|
if (!nh_grp->gateway) {
|
|
|
|
mlxsw_sp_nexthop_fib_entries_update(mlxsw_sp, nh_grp);
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
|
2016-07-05 17:27:50 +08:00
|
|
|
for (i = 0; i < nh_grp->count; i++) {
|
|
|
|
nh = &nh_grp->nexthops[i];
|
|
|
|
|
2017-07-31 15:27:29 +08:00
|
|
|
if (nh->should_offload != nh->offloaded) {
|
2016-07-05 17:27:50 +08:00
|
|
|
offload_change = true;
|
|
|
|
if (nh->should_offload)
|
|
|
|
nh->update = 1;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
if (!offload_change) {
|
|
|
|
/* Nothing was added or removed, so no need to reallocate. Just
|
|
|
|
* update MAC on existing adjacency indexes.
|
|
|
|
*/
|
mlxsw: spectrum_router: Make nexthops typed
In the router, some next hops may reference an encapsulating netdevice,
such as GRE or IPIP. To properly offload these next hops, mlxsw needs to
keep track of whether a given next hop is a regular Ethernet entry, or
an IP-in-IP tunneling entry.
To facilitate this book-keeping, add a type field to struct
mlxsw_sp_nexthop. There is, as of this patch, only one next hop type:
MLXSW_SP_NEXTHOP_TYPE_ETH. Follow-up patches will introduce the IP-in-IP
variant.
There are several places where next hops are initialized in the IPv4
path. Instead of replicating the logic at every one of them, factor it
out to a function mlxsw_sp_nexthop4_type_init(). The corresponding fini
is actually protocol-neutral, so put it to mlxsw_sp_nexthop_type_fini(),
but create a corresponding protocoled _fini function that dispatches to
the protocol-neutral one.
The IPv6 path is simpler, but for symmetry with IPv4, create the same
suite of functions with corresponding logic.
Signed-off-by: Petr Machata <petrm@mellanox.com>
Reviewed-by: Ido Schimmel <idosch@mellanox.com>
Signed-off-by: Jiri Pirko <jiri@mellanox.com>
Signed-off-by: David S. Miller <davem@davemloft.net>
2017-09-03 05:49:22 +08:00
|
|
|
err = mlxsw_sp_nexthop_group_update(mlxsw_sp, nh_grp, false);
|
2016-07-05 17:27:50 +08:00
|
|
|
if (err) {
|
|
|
|
dev_warn(mlxsw_sp->bus_info->dev, "Failed to update neigh MAC in adjacency table.\n");
|
|
|
|
goto set_trap;
|
|
|
|
}
|
|
|
|
return;
|
|
|
|
}
|
2017-10-23 05:11:48 +08:00
|
|
|
mlxsw_sp_nexthop_group_normalize(nh_grp);
|
|
|
|
if (!nh_grp->sum_norm_weight)
|
2016-07-05 17:27:50 +08:00
|
|
|
/* No neigh of this group is connected so we just set
|
|
|
|
* the trap and let everthing flow through kernel.
|
|
|
|
*/
|
|
|
|
goto set_trap;
|
|
|
|
|
2017-10-23 05:11:48 +08:00
|
|
|
ecmp_size = nh_grp->sum_norm_weight;
|
2017-10-23 05:11:47 +08:00
|
|
|
err = mlxsw_sp_fix_adj_grp_size(mlxsw_sp, &ecmp_size);
|
|
|
|
if (err)
|
|
|
|
/* No valid allocation size available. */
|
|
|
|
goto set_trap;
|
|
|
|
|
2018-07-09 04:51:17 +08:00
|
|
|
err = mlxsw_sp_kvdl_alloc(mlxsw_sp, MLXSW_SP_KVDL_ENTRY_TYPE_ADJ,
|
|
|
|
ecmp_size, &adj_index);
|
2017-03-25 15:28:22 +08:00
|
|
|
if (err) {
|
2016-07-05 17:27:50 +08:00
|
|
|
/* We ran out of KVD linear space, just set the
|
|
|
|
* trap and let everything flow through kernel.
|
|
|
|
*/
|
|
|
|
dev_warn(mlxsw_sp->bus_info->dev, "Failed to allocate KVD linear area for nexthop group.\n");
|
|
|
|
goto set_trap;
|
|
|
|
}
|
|
|
|
old_adj_index_valid = nh_grp->adj_index_valid;
|
|
|
|
old_adj_index = nh_grp->adj_index;
|
|
|
|
old_ecmp_size = nh_grp->ecmp_size;
|
|
|
|
nh_grp->adj_index_valid = 1;
|
|
|
|
nh_grp->adj_index = adj_index;
|
|
|
|
nh_grp->ecmp_size = ecmp_size;
|
2017-10-23 05:11:48 +08:00
|
|
|
mlxsw_sp_nexthop_group_rebalance(nh_grp);
|
mlxsw: spectrum_router: Make nexthops typed
In the router, some next hops may reference an encapsulating netdevice,
such as GRE or IPIP. To properly offload these next hops, mlxsw needs to
keep track of whether a given next hop is a regular Ethernet entry, or
an IP-in-IP tunneling entry.
To facilitate this book-keeping, add a type field to struct
mlxsw_sp_nexthop. There is, as of this patch, only one next hop type:
MLXSW_SP_NEXTHOP_TYPE_ETH. Follow-up patches will introduce the IP-in-IP
variant.
There are several places where next hops are initialized in the IPv4
path. Instead of replicating the logic at every one of them, factor it
out to a function mlxsw_sp_nexthop4_type_init(). The corresponding fini
is actually protocol-neutral, so put it to mlxsw_sp_nexthop_type_fini(),
but create a corresponding protocoled _fini function that dispatches to
the protocol-neutral one.
The IPv6 path is simpler, but for symmetry with IPv4, create the same
suite of functions with corresponding logic.
Signed-off-by: Petr Machata <petrm@mellanox.com>
Reviewed-by: Ido Schimmel <idosch@mellanox.com>
Signed-off-by: Jiri Pirko <jiri@mellanox.com>
Signed-off-by: David S. Miller <davem@davemloft.net>
2017-09-03 05:49:22 +08:00
|
|
|
err = mlxsw_sp_nexthop_group_update(mlxsw_sp, nh_grp, true);
|
2016-07-05 17:27:50 +08:00
|
|
|
if (err) {
|
|
|
|
dev_warn(mlxsw_sp->bus_info->dev, "Failed to update neigh MAC in adjacency table.\n");
|
|
|
|
goto set_trap;
|
|
|
|
}
|
|
|
|
|
2020-01-14 19:23:13 +08:00
|
|
|
mlxsw_sp_nexthop_group_offload_refresh(mlxsw_sp, nh_grp);
|
|
|
|
|
2016-07-05 17:27:50 +08:00
|
|
|
if (!old_adj_index_valid) {
|
|
|
|
/* The trap was set for fib entries, so we have to call
|
|
|
|
* fib entry update to unset it and use adjacency index.
|
|
|
|
*/
|
|
|
|
err = mlxsw_sp_nexthop_fib_entries_update(mlxsw_sp, nh_grp);
|
|
|
|
if (err) {
|
|
|
|
dev_warn(mlxsw_sp->bus_info->dev, "Failed to add adjacency index to fib entries.\n");
|
|
|
|
goto set_trap;
|
|
|
|
}
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
|
|
|
|
err = mlxsw_sp_adj_index_mass_update(mlxsw_sp, nh_grp,
|
|
|
|
old_adj_index, old_ecmp_size);
|
2018-07-09 04:51:17 +08:00
|
|
|
mlxsw_sp_kvdl_free(mlxsw_sp, MLXSW_SP_KVDL_ENTRY_TYPE_ADJ,
|
2018-07-09 04:51:18 +08:00
|
|
|
old_ecmp_size, old_adj_index);
|
2016-07-05 17:27:50 +08:00
|
|
|
if (err) {
|
|
|
|
dev_warn(mlxsw_sp->bus_info->dev, "Failed to mass-update adjacency index for nexthop group.\n");
|
|
|
|
goto set_trap;
|
|
|
|
}
|
2017-08-02 15:56:05 +08:00
|
|
|
|
2016-07-05 17:27:50 +08:00
|
|
|
return;
|
|
|
|
|
|
|
|
set_trap:
|
|
|
|
old_adj_index_valid = nh_grp->adj_index_valid;
|
|
|
|
nh_grp->adj_index_valid = 0;
|
|
|
|
for (i = 0; i < nh_grp->count; i++) {
|
|
|
|
nh = &nh_grp->nexthops[i];
|
|
|
|
nh->offloaded = 0;
|
|
|
|
}
|
|
|
|
err = mlxsw_sp_nexthop_fib_entries_update(mlxsw_sp, nh_grp);
|
|
|
|
if (err)
|
|
|
|
dev_warn(mlxsw_sp->bus_info->dev, "Failed to set traps for fib entries.\n");
|
2020-01-14 19:23:13 +08:00
|
|
|
mlxsw_sp_nexthop_group_offload_refresh(mlxsw_sp, nh_grp);
|
2016-07-05 17:27:50 +08:00
|
|
|
if (old_adj_index_valid)
|
2018-07-09 04:51:17 +08:00
|
|
|
mlxsw_sp_kvdl_free(mlxsw_sp, MLXSW_SP_KVDL_ENTRY_TYPE_ADJ,
|
2018-07-09 04:51:18 +08:00
|
|
|
nh_grp->ecmp_size, nh_grp->adj_index);
|
2016-07-05 17:27:50 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
static void __mlxsw_sp_nexthop_neigh_update(struct mlxsw_sp_nexthop *nh,
|
|
|
|
bool removing)
|
|
|
|
{
|
2017-07-31 15:27:30 +08:00
|
|
|
if (!removing)
|
2016-07-05 17:27:50 +08:00
|
|
|
nh->should_offload = 1;
|
2017-12-25 15:57:35 +08:00
|
|
|
else
|
2016-07-05 17:27:50 +08:00
|
|
|
nh->should_offload = 0;
|
|
|
|
nh->update = 1;
|
|
|
|
}
|
|
|
|
|
2019-06-11 15:19:41 +08:00
|
|
|
static int
|
|
|
|
mlxsw_sp_nexthop_dead_neigh_replace(struct mlxsw_sp *mlxsw_sp,
|
|
|
|
struct mlxsw_sp_neigh_entry *neigh_entry)
|
|
|
|
{
|
|
|
|
struct neighbour *n, *old_n = neigh_entry->key.n;
|
|
|
|
struct mlxsw_sp_nexthop *nh;
|
|
|
|
bool entry_connected;
|
|
|
|
u8 nud_state, dead;
|
|
|
|
int err;
|
|
|
|
|
|
|
|
nh = list_first_entry(&neigh_entry->nexthop_list,
|
|
|
|
struct mlxsw_sp_nexthop, neigh_list_node);
|
|
|
|
|
|
|
|
n = neigh_lookup(nh->nh_grp->neigh_tbl, &nh->gw_addr, nh->rif->dev);
|
|
|
|
if (!n) {
|
|
|
|
n = neigh_create(nh->nh_grp->neigh_tbl, &nh->gw_addr,
|
|
|
|
nh->rif->dev);
|
|
|
|
if (IS_ERR(n))
|
|
|
|
return PTR_ERR(n);
|
|
|
|
neigh_event_send(n, NULL);
|
|
|
|
}
|
|
|
|
|
|
|
|
mlxsw_sp_neigh_entry_remove(mlxsw_sp, neigh_entry);
|
|
|
|
neigh_entry->key.n = n;
|
|
|
|
err = mlxsw_sp_neigh_entry_insert(mlxsw_sp, neigh_entry);
|
|
|
|
if (err)
|
|
|
|
goto err_neigh_entry_insert;
|
|
|
|
|
|
|
|
read_lock_bh(&n->lock);
|
|
|
|
nud_state = n->nud_state;
|
|
|
|
dead = n->dead;
|
|
|
|
read_unlock_bh(&n->lock);
|
|
|
|
entry_connected = nud_state & NUD_VALID && !dead;
|
|
|
|
|
|
|
|
list_for_each_entry(nh, &neigh_entry->nexthop_list,
|
|
|
|
neigh_list_node) {
|
|
|
|
neigh_release(old_n);
|
|
|
|
neigh_clone(n);
|
|
|
|
__mlxsw_sp_nexthop_neigh_update(nh, !entry_connected);
|
|
|
|
mlxsw_sp_nexthop_group_refresh(mlxsw_sp, nh->nh_grp);
|
|
|
|
}
|
|
|
|
|
|
|
|
neigh_release(n);
|
|
|
|
|
|
|
|
return 0;
|
|
|
|
|
|
|
|
err_neigh_entry_insert:
|
|
|
|
neigh_entry->key.n = old_n;
|
|
|
|
mlxsw_sp_neigh_entry_insert(mlxsw_sp, neigh_entry);
|
|
|
|
neigh_release(n);
|
|
|
|
return err;
|
|
|
|
}
|
|
|
|
|
2016-07-05 17:27:50 +08:00
|
|
|
static void
|
|
|
|
mlxsw_sp_nexthop_neigh_update(struct mlxsw_sp *mlxsw_sp,
|
|
|
|
struct mlxsw_sp_neigh_entry *neigh_entry,
|
2019-06-11 15:19:41 +08:00
|
|
|
bool removing, bool dead)
|
2016-07-05 17:27:50 +08:00
|
|
|
{
|
|
|
|
struct mlxsw_sp_nexthop *nh;
|
|
|
|
|
2019-06-11 15:19:41 +08:00
|
|
|
if (list_empty(&neigh_entry->nexthop_list))
|
|
|
|
return;
|
|
|
|
|
|
|
|
if (dead) {
|
|
|
|
int err;
|
|
|
|
|
|
|
|
err = mlxsw_sp_nexthop_dead_neigh_replace(mlxsw_sp,
|
|
|
|
neigh_entry);
|
|
|
|
if (err)
|
|
|
|
dev_err(mlxsw_sp->bus_info->dev, "Failed to replace dead neigh\n");
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
|
2016-07-05 17:27:50 +08:00
|
|
|
list_for_each_entry(nh, &neigh_entry->nexthop_list,
|
|
|
|
neigh_list_node) {
|
|
|
|
__mlxsw_sp_nexthop_neigh_update(nh, removing);
|
|
|
|
mlxsw_sp_nexthop_group_refresh(mlxsw_sp, nh->nh_grp);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2017-02-08 18:16:42 +08:00
|
|
|
static void mlxsw_sp_nexthop_rif_init(struct mlxsw_sp_nexthop *nh,
|
2017-03-17 16:38:00 +08:00
|
|
|
struct mlxsw_sp_rif *rif)
|
2017-02-08 18:16:42 +08:00
|
|
|
{
|
2017-03-17 16:38:00 +08:00
|
|
|
if (nh->rif)
|
2017-02-08 18:16:42 +08:00
|
|
|
return;
|
|
|
|
|
2017-03-17 16:38:00 +08:00
|
|
|
nh->rif = rif;
|
|
|
|
list_add(&nh->rif_list_node, &rif->nexthop_list);
|
2017-02-08 18:16:42 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
static void mlxsw_sp_nexthop_rif_fini(struct mlxsw_sp_nexthop *nh)
|
|
|
|
{
|
2017-03-17 16:38:00 +08:00
|
|
|
if (!nh->rif)
|
2017-02-08 18:16:42 +08:00
|
|
|
return;
|
|
|
|
|
|
|
|
list_del(&nh->rif_list_node);
|
2017-03-17 16:38:00 +08:00
|
|
|
nh->rif = NULL;
|
2017-02-08 18:16:42 +08:00
|
|
|
}
|
|
|
|
|
2017-02-08 18:16:35 +08:00
|
|
|
static int mlxsw_sp_nexthop_neigh_init(struct mlxsw_sp *mlxsw_sp,
|
|
|
|
struct mlxsw_sp_nexthop *nh)
|
2016-07-05 17:27:50 +08:00
|
|
|
{
|
|
|
|
struct mlxsw_sp_neigh_entry *neigh_entry;
|
|
|
|
struct neighbour *n;
|
2016-12-23 16:32:49 +08:00
|
|
|
u8 nud_state, dead;
|
2017-02-08 18:16:30 +08:00
|
|
|
int err;
|
|
|
|
|
mlxsw: spectrum_router: Reflect nexthop status changes
When a packet hits a multipath route in the device's routing table, a
hash is computed over its headers, which is then used to select the
appropriate nexthop from the device's adjacency table.
There are situations in which the kernel removes a nexthop from a
multipath route (e.g., no carrier) and the device should do the same.
Upon the reception of NH_{ADD,DEL} events, add or remove a nexthop from
the device's adjacency table and refresh all the routes using the
nexthop group. If all the nexthops of a multipath route are invalid,
then any packet hitting the route would be trapped to the CPU for
forwarding.
If all the nexthops are DEAD, then the kernel would remove the route
entirely. On the other hand, if all the nexthops are merely LINKDOWN,
then the kernel would keep the route and forward any incoming packet
using a different route.
While the last case might sound like a problem, it's expected that a
routing daemon running in user space would remove such a route from the
FIB as it's dumped with the DEAD flag set.
Signed-off-by: Ido Schimmel <idosch@mellanox.com>
Signed-off-by: Jiri Pirko <jiri@mellanox.com>
Signed-off-by: David S. Miller <davem@davemloft.net>
2017-02-08 18:16:40 +08:00
|
|
|
if (!nh->nh_grp->gateway || nh->neigh_entry)
|
2017-02-08 18:16:33 +08:00
|
|
|
return 0;
|
|
|
|
|
2016-11-10 19:31:04 +08:00
|
|
|
/* Take a reference of neigh here ensuring that neigh would
|
2017-07-31 15:27:25 +08:00
|
|
|
* not be destructed before the nexthop entry is finished.
|
2016-11-10 19:31:04 +08:00
|
|
|
* The reference is taken either in neigh_lookup() or
|
2017-02-06 23:20:17 +08:00
|
|
|
* in neigh_create() in case n is not found.
|
2016-11-10 19:31:04 +08:00
|
|
|
*/
|
2017-07-18 16:10:19 +08:00
|
|
|
n = neigh_lookup(nh->nh_grp->neigh_tbl, &nh->gw_addr, nh->rif->dev);
|
2016-11-10 19:31:04 +08:00
|
|
|
if (!n) {
|
2017-07-18 16:10:19 +08:00
|
|
|
n = neigh_create(nh->nh_grp->neigh_tbl, &nh->gw_addr,
|
|
|
|
nh->rif->dev);
|
2017-02-08 18:16:35 +08:00
|
|
|
if (IS_ERR(n))
|
|
|
|
return PTR_ERR(n);
|
2016-07-05 17:27:50 +08:00
|
|
|
neigh_event_send(n, NULL);
|
2016-11-10 19:31:04 +08:00
|
|
|
}
|
|
|
|
neigh_entry = mlxsw_sp_neigh_entry_lookup(mlxsw_sp, n);
|
|
|
|
if (!neigh_entry) {
|
2017-02-06 23:20:13 +08:00
|
|
|
neigh_entry = mlxsw_sp_neigh_entry_create(mlxsw_sp, n);
|
|
|
|
if (IS_ERR(neigh_entry)) {
|
2017-02-08 18:16:30 +08:00
|
|
|
err = -EINVAL;
|
|
|
|
goto err_neigh_entry_create;
|
2017-02-06 23:20:13 +08:00
|
|
|
}
|
2016-07-05 17:27:50 +08:00
|
|
|
}
|
2016-07-05 17:27:51 +08:00
|
|
|
|
|
|
|
/* If that is the first nexthop connected to that neigh, add to
|
|
|
|
* nexthop_neighs_list
|
|
|
|
*/
|
|
|
|
if (list_empty(&neigh_entry->nexthop_list))
|
|
|
|
list_add_tail(&neigh_entry->nexthop_neighs_list_node,
|
2017-05-17 01:38:25 +08:00
|
|
|
&mlxsw_sp->router->nexthop_neighs_list);
|
2016-07-05 17:27:51 +08:00
|
|
|
|
2016-07-05 17:27:50 +08:00
|
|
|
nh->neigh_entry = neigh_entry;
|
|
|
|
list_add_tail(&nh->neigh_list_node, &neigh_entry->nexthop_list);
|
|
|
|
read_lock_bh(&n->lock);
|
|
|
|
nud_state = n->nud_state;
|
2016-12-23 16:32:49 +08:00
|
|
|
dead = n->dead;
|
2016-07-05 17:27:50 +08:00
|
|
|
read_unlock_bh(&n->lock);
|
2016-12-23 16:32:49 +08:00
|
|
|
__mlxsw_sp_nexthop_neigh_update(nh, !(nud_state & NUD_VALID && !dead));
|
2016-07-05 17:27:50 +08:00
|
|
|
|
|
|
|
return 0;
|
2017-02-08 18:16:30 +08:00
|
|
|
|
|
|
|
err_neigh_entry_create:
|
|
|
|
neigh_release(n);
|
|
|
|
return err;
|
2016-07-05 17:27:50 +08:00
|
|
|
}
|
|
|
|
|
2017-02-08 18:16:35 +08:00
|
|
|
static void mlxsw_sp_nexthop_neigh_fini(struct mlxsw_sp *mlxsw_sp,
|
|
|
|
struct mlxsw_sp_nexthop *nh)
|
2016-07-05 17:27:50 +08:00
|
|
|
{
|
|
|
|
struct mlxsw_sp_neigh_entry *neigh_entry = nh->neigh_entry;
|
2017-02-08 18:16:35 +08:00
|
|
|
struct neighbour *n;
|
2016-07-05 17:27:50 +08:00
|
|
|
|
2017-02-08 18:16:33 +08:00
|
|
|
if (!neigh_entry)
|
2017-02-08 18:16:35 +08:00
|
|
|
return;
|
|
|
|
n = neigh_entry->key.n;
|
2017-02-08 18:16:33 +08:00
|
|
|
|
2016-12-23 16:32:50 +08:00
|
|
|
__mlxsw_sp_nexthop_neigh_update(nh, true);
|
2016-07-05 17:27:50 +08:00
|
|
|
list_del(&nh->neigh_list_node);
|
2017-02-08 18:16:28 +08:00
|
|
|
nh->neigh_entry = NULL;
|
2016-07-05 17:27:51 +08:00
|
|
|
|
|
|
|
/* If that is the last nexthop connected to that neigh, remove from
|
|
|
|
* nexthop_neighs_list
|
|
|
|
*/
|
2017-02-08 18:16:28 +08:00
|
|
|
if (list_empty(&neigh_entry->nexthop_list))
|
|
|
|
list_del(&neigh_entry->nexthop_neighs_list_node);
|
2016-07-05 17:27:51 +08:00
|
|
|
|
2017-02-06 23:20:13 +08:00
|
|
|
if (!neigh_entry->connected && list_empty(&neigh_entry->nexthop_list))
|
|
|
|
mlxsw_sp_neigh_entry_destroy(mlxsw_sp, neigh_entry);
|
|
|
|
|
|
|
|
neigh_release(n);
|
2017-02-08 18:16:35 +08:00
|
|
|
}
|
2017-02-08 18:16:30 +08:00
|
|
|
|
2017-11-03 17:03:44 +08:00
|
|
|
static bool mlxsw_sp_ipip_netdev_ul_up(struct net_device *ol_dev)
|
|
|
|
{
|
2020-02-20 15:07:55 +08:00
|
|
|
struct net_device *ul_dev;
|
|
|
|
bool is_up;
|
|
|
|
|
|
|
|
rcu_read_lock();
|
|
|
|
ul_dev = __mlxsw_sp_ipip_netdev_ul_dev_get(ol_dev);
|
|
|
|
is_up = ul_dev ? (ul_dev->flags & IFF_UP) : true;
|
|
|
|
rcu_read_unlock();
|
2017-11-03 17:03:44 +08:00
|
|
|
|
2020-02-20 15:07:55 +08:00
|
|
|
return is_up;
|
2017-11-03 17:03:44 +08:00
|
|
|
}
|
|
|
|
|
2017-11-28 20:17:13 +08:00
|
|
|
static void mlxsw_sp_nexthop_ipip_init(struct mlxsw_sp *mlxsw_sp,
|
|
|
|
struct mlxsw_sp_nexthop *nh,
|
|
|
|
struct mlxsw_sp_ipip_entry *ipip_entry)
|
2017-09-03 05:49:23 +08:00
|
|
|
{
|
2017-11-03 17:03:44 +08:00
|
|
|
bool removing;
|
|
|
|
|
2017-09-03 05:49:23 +08:00
|
|
|
if (!nh->nh_grp->gateway || nh->ipip_entry)
|
2017-11-28 20:17:13 +08:00
|
|
|
return;
|
2017-09-03 05:49:23 +08:00
|
|
|
|
2017-11-28 20:17:13 +08:00
|
|
|
nh->ipip_entry = ipip_entry;
|
|
|
|
removing = !mlxsw_sp_ipip_netdev_ul_up(ipip_entry->ol_dev);
|
2017-11-03 17:03:44 +08:00
|
|
|
__mlxsw_sp_nexthop_neigh_update(nh, removing);
|
2017-11-28 20:17:13 +08:00
|
|
|
mlxsw_sp_nexthop_rif_init(nh, &ipip_entry->ol_lb->common);
|
2017-09-03 05:49:23 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
static void mlxsw_sp_nexthop_ipip_fini(struct mlxsw_sp *mlxsw_sp,
|
|
|
|
struct mlxsw_sp_nexthop *nh)
|
|
|
|
{
|
|
|
|
struct mlxsw_sp_ipip_entry *ipip_entry = nh->ipip_entry;
|
|
|
|
|
|
|
|
if (!ipip_entry)
|
|
|
|
return;
|
|
|
|
|
|
|
|
__mlxsw_sp_nexthop_neigh_update(nh, true);
|
|
|
|
nh->ipip_entry = NULL;
|
|
|
|
}
|
|
|
|
|
|
|
|
static bool mlxsw_sp_nexthop4_ipip_type(const struct mlxsw_sp *mlxsw_sp,
|
|
|
|
const struct fib_nh *fib_nh,
|
|
|
|
enum mlxsw_sp_ipip_type *p_ipipt)
|
|
|
|
{
|
2019-03-28 11:53:55 +08:00
|
|
|
struct net_device *dev = fib_nh->fib_nh_dev;
|
2017-09-03 05:49:23 +08:00
|
|
|
|
|
|
|
return dev &&
|
|
|
|
fib_nh->nh_parent->fib_type == RTN_UNICAST &&
|
|
|
|
mlxsw_sp_netdev_ipip_type(mlxsw_sp, dev, p_ipipt);
|
|
|
|
}
|
|
|
|
|
mlxsw: spectrum_router: Make nexthops typed
In the router, some next hops may reference an encapsulating netdevice,
such as GRE or IPIP. To properly offload these next hops, mlxsw needs to
keep track of whether a given next hop is a regular Ethernet entry, or
an IP-in-IP tunneling entry.
To facilitate this book-keeping, add a type field to struct
mlxsw_sp_nexthop. There is, as of this patch, only one next hop type:
MLXSW_SP_NEXTHOP_TYPE_ETH. Follow-up patches will introduce the IP-in-IP
variant.
There are several places where next hops are initialized in the IPv4
path. Instead of replicating the logic at every one of them, factor it
out to a function mlxsw_sp_nexthop4_type_init(). The corresponding fini
is actually protocol-neutral, so put it to mlxsw_sp_nexthop_type_fini(),
but create a corresponding protocoled _fini function that dispatches to
the protocol-neutral one.
The IPv6 path is simpler, but for symmetry with IPv4, create the same
suite of functions with corresponding logic.
Signed-off-by: Petr Machata <petrm@mellanox.com>
Reviewed-by: Ido Schimmel <idosch@mellanox.com>
Signed-off-by: Jiri Pirko <jiri@mellanox.com>
Signed-off-by: David S. Miller <davem@davemloft.net>
2017-09-03 05:49:22 +08:00
|
|
|
static void mlxsw_sp_nexthop_type_fini(struct mlxsw_sp *mlxsw_sp,
|
|
|
|
struct mlxsw_sp_nexthop *nh)
|
|
|
|
{
|
|
|
|
switch (nh->type) {
|
|
|
|
case MLXSW_SP_NEXTHOP_TYPE_ETH:
|
|
|
|
mlxsw_sp_nexthop_neigh_fini(mlxsw_sp, nh);
|
|
|
|
mlxsw_sp_nexthop_rif_fini(nh);
|
|
|
|
break;
|
2017-09-03 05:49:23 +08:00
|
|
|
case MLXSW_SP_NEXTHOP_TYPE_IPIP:
|
2017-10-02 18:14:57 +08:00
|
|
|
mlxsw_sp_nexthop_rif_fini(nh);
|
2017-09-03 05:49:23 +08:00
|
|
|
mlxsw_sp_nexthop_ipip_fini(mlxsw_sp, nh);
|
|
|
|
break;
|
mlxsw: spectrum_router: Make nexthops typed
In the router, some next hops may reference an encapsulating netdevice,
such as GRE or IPIP. To properly offload these next hops, mlxsw needs to
keep track of whether a given next hop is a regular Ethernet entry, or
an IP-in-IP tunneling entry.
To facilitate this book-keeping, add a type field to struct
mlxsw_sp_nexthop. There is, as of this patch, only one next hop type:
MLXSW_SP_NEXTHOP_TYPE_ETH. Follow-up patches will introduce the IP-in-IP
variant.
There are several places where next hops are initialized in the IPv4
path. Instead of replicating the logic at every one of them, factor it
out to a function mlxsw_sp_nexthop4_type_init(). The corresponding fini
is actually protocol-neutral, so put it to mlxsw_sp_nexthop_type_fini(),
but create a corresponding protocoled _fini function that dispatches to
the protocol-neutral one.
The IPv6 path is simpler, but for symmetry with IPv4, create the same
suite of functions with corresponding logic.
Signed-off-by: Petr Machata <petrm@mellanox.com>
Reviewed-by: Ido Schimmel <idosch@mellanox.com>
Signed-off-by: Jiri Pirko <jiri@mellanox.com>
Signed-off-by: David S. Miller <davem@davemloft.net>
2017-09-03 05:49:22 +08:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
static int mlxsw_sp_nexthop4_type_init(struct mlxsw_sp *mlxsw_sp,
|
|
|
|
struct mlxsw_sp_nexthop *nh,
|
|
|
|
struct fib_nh *fib_nh)
|
|
|
|
{
|
2017-11-28 20:17:13 +08:00
|
|
|
const struct mlxsw_sp_ipip_ops *ipip_ops;
|
2019-03-28 11:53:55 +08:00
|
|
|
struct net_device *dev = fib_nh->fib_nh_dev;
|
2017-11-28 20:17:13 +08:00
|
|
|
struct mlxsw_sp_ipip_entry *ipip_entry;
|
mlxsw: spectrum_router: Make nexthops typed
In the router, some next hops may reference an encapsulating netdevice,
such as GRE or IPIP. To properly offload these next hops, mlxsw needs to
keep track of whether a given next hop is a regular Ethernet entry, or
an IP-in-IP tunneling entry.
To facilitate this book-keeping, add a type field to struct
mlxsw_sp_nexthop. There is, as of this patch, only one next hop type:
MLXSW_SP_NEXTHOP_TYPE_ETH. Follow-up patches will introduce the IP-in-IP
variant.
There are several places where next hops are initialized in the IPv4
path. Instead of replicating the logic at every one of them, factor it
out to a function mlxsw_sp_nexthop4_type_init(). The corresponding fini
is actually protocol-neutral, so put it to mlxsw_sp_nexthop_type_fini(),
but create a corresponding protocoled _fini function that dispatches to
the protocol-neutral one.
The IPv6 path is simpler, but for symmetry with IPv4, create the same
suite of functions with corresponding logic.
Signed-off-by: Petr Machata <petrm@mellanox.com>
Reviewed-by: Ido Schimmel <idosch@mellanox.com>
Signed-off-by: Jiri Pirko <jiri@mellanox.com>
Signed-off-by: David S. Miller <davem@davemloft.net>
2017-09-03 05:49:22 +08:00
|
|
|
struct mlxsw_sp_rif *rif;
|
|
|
|
int err;
|
|
|
|
|
2017-11-28 20:17:13 +08:00
|
|
|
ipip_entry = mlxsw_sp_ipip_entry_find_by_ol_dev(mlxsw_sp, dev);
|
|
|
|
if (ipip_entry) {
|
|
|
|
ipip_ops = mlxsw_sp->router->ipip_ops_arr[ipip_entry->ipipt];
|
|
|
|
if (ipip_ops->can_offload(mlxsw_sp, dev,
|
|
|
|
MLXSW_SP_L3_PROTO_IPV4)) {
|
|
|
|
nh->type = MLXSW_SP_NEXTHOP_TYPE_IPIP;
|
|
|
|
mlxsw_sp_nexthop_ipip_init(mlxsw_sp, nh, ipip_entry);
|
|
|
|
return 0;
|
|
|
|
}
|
2017-09-03 05:49:23 +08:00
|
|
|
}
|
|
|
|
|
mlxsw: spectrum_router: Make nexthops typed
In the router, some next hops may reference an encapsulating netdevice,
such as GRE or IPIP. To properly offload these next hops, mlxsw needs to
keep track of whether a given next hop is a regular Ethernet entry, or
an IP-in-IP tunneling entry.
To facilitate this book-keeping, add a type field to struct
mlxsw_sp_nexthop. There is, as of this patch, only one next hop type:
MLXSW_SP_NEXTHOP_TYPE_ETH. Follow-up patches will introduce the IP-in-IP
variant.
There are several places where next hops are initialized in the IPv4
path. Instead of replicating the logic at every one of them, factor it
out to a function mlxsw_sp_nexthop4_type_init(). The corresponding fini
is actually protocol-neutral, so put it to mlxsw_sp_nexthop_type_fini(),
but create a corresponding protocoled _fini function that dispatches to
the protocol-neutral one.
The IPv6 path is simpler, but for symmetry with IPv4, create the same
suite of functions with corresponding logic.
Signed-off-by: Petr Machata <petrm@mellanox.com>
Reviewed-by: Ido Schimmel <idosch@mellanox.com>
Signed-off-by: Jiri Pirko <jiri@mellanox.com>
Signed-off-by: David S. Miller <davem@davemloft.net>
2017-09-03 05:49:22 +08:00
|
|
|
nh->type = MLXSW_SP_NEXTHOP_TYPE_ETH;
|
|
|
|
rif = mlxsw_sp_rif_find_by_dev(mlxsw_sp, dev);
|
|
|
|
if (!rif)
|
|
|
|
return 0;
|
|
|
|
|
|
|
|
mlxsw_sp_nexthop_rif_init(nh, rif);
|
|
|
|
err = mlxsw_sp_nexthop_neigh_init(mlxsw_sp, nh);
|
|
|
|
if (err)
|
|
|
|
goto err_neigh_init;
|
|
|
|
|
|
|
|
return 0;
|
|
|
|
|
|
|
|
err_neigh_init:
|
|
|
|
mlxsw_sp_nexthop_rif_fini(nh);
|
|
|
|
return err;
|
|
|
|
}
|
|
|
|
|
|
|
|
/* IPv4 counterpart of mlxsw_sp_nexthop4_type_init(); it simply forwards to
 * the protocol-neutral mlxsw_sp_nexthop_type_fini().
 */
static void mlxsw_sp_nexthop4_type_fini(struct mlxsw_sp *mlxsw_sp,
					struct mlxsw_sp_nexthop *nh)
{
	mlxsw_sp_nexthop_type_fini(mlxsw_sp, nh);
}
|
|
|
|
|
2017-07-18 16:10:27 +08:00
|
|
|
static int mlxsw_sp_nexthop4_init(struct mlxsw_sp *mlxsw_sp,
|
|
|
|
struct mlxsw_sp_nexthop_group *nh_grp,
|
|
|
|
struct mlxsw_sp_nexthop *nh,
|
|
|
|
struct fib_nh *fib_nh)
|
2017-02-08 18:16:35 +08:00
|
|
|
{
|
2019-03-28 11:53:55 +08:00
|
|
|
struct net_device *dev = fib_nh->fib_nh_dev;
|
2017-02-08 21:36:49 +08:00
|
|
|
struct in_device *in_dev;
|
2017-02-08 18:16:35 +08:00
|
|
|
int err;
|
|
|
|
|
|
|
|
nh->nh_grp = nh_grp;
|
|
|
|
nh->key.fib_nh = fib_nh;
|
2017-10-23 05:11:46 +08:00
|
|
|
#ifdef CONFIG_IP_ROUTE_MULTIPATH
|
2019-03-28 11:53:55 +08:00
|
|
|
nh->nh_weight = fib_nh->fib_nh_weight;
|
2017-10-23 05:11:46 +08:00
|
|
|
#else
|
|
|
|
nh->nh_weight = 1;
|
|
|
|
#endif
|
2019-03-28 11:53:55 +08:00
|
|
|
memcpy(&nh->gw_addr, &fib_nh->fib_nh_gw4, sizeof(fib_nh->fib_nh_gw4));
|
2017-02-08 18:16:35 +08:00
|
|
|
err = mlxsw_sp_nexthop_insert(mlxsw_sp, nh);
|
|
|
|
if (err)
|
|
|
|
return err;
|
|
|
|
|
2017-09-25 16:32:28 +08:00
|
|
|
mlxsw_sp_nexthop_counter_alloc(mlxsw_sp, nh);
|
2017-09-25 16:32:23 +08:00
|
|
|
list_add_tail(&nh->router_list_node, &mlxsw_sp->router->nexthop_list);
|
|
|
|
|
2017-03-10 15:53:38 +08:00
|
|
|
if (!dev)
|
|
|
|
return 0;
|
|
|
|
|
2020-02-20 15:07:53 +08:00
|
|
|
rcu_read_lock();
|
|
|
|
in_dev = __in_dev_get_rcu(dev);
|
2017-02-08 21:36:49 +08:00
|
|
|
if (in_dev && IN_DEV_IGNORE_ROUTES_WITH_LINKDOWN(in_dev) &&
|
2020-02-20 15:07:53 +08:00
|
|
|
fib_nh->fib_nh_flags & RTNH_F_LINKDOWN) {
|
|
|
|
rcu_read_unlock();
|
2017-02-08 21:36:49 +08:00
|
|
|
return 0;
|
2020-02-20 15:07:53 +08:00
|
|
|
}
|
|
|
|
rcu_read_unlock();
|
2017-02-08 21:36:49 +08:00
|
|
|
|
mlxsw: spectrum_router: Make nexthops typed
In the router, some next hops may reference an encapsulating netdevice,
such as GRE or IPIP. To properly offload these next hops, mlxsw needs to
keep track of whether a given next hop is a regular Ethernet entry, or
an IP-in-IP tunneling entry.
To facilitate this book-keeping, add a type field to struct
mlxsw_sp_nexthop. There is, as of this patch, only one next hop type:
MLXSW_SP_NEXTHOP_TYPE_ETH. Follow-up patches will introduce the IP-in-IP
variant.
There are several places where next hops are initialized in the IPv4
path. Instead of replicating the logic at every one of them, factor it
out to a function mlxsw_sp_nexthop4_type_init(). The corresponding fini
is actually protocol-neutral, so put it to mlxsw_sp_nexthop_type_fini(),
but create a corresponding protocoled _fini function that dispatches to
the protocol-neutral one.
The IPv6 path is simpler, but for symmetry with IPv4, create the same
suite of functions with corresponding logic.
Signed-off-by: Petr Machata <petrm@mellanox.com>
Reviewed-by: Ido Schimmel <idosch@mellanox.com>
Signed-off-by: Jiri Pirko <jiri@mellanox.com>
Signed-off-by: David S. Miller <davem@davemloft.net>
2017-09-03 05:49:22 +08:00
|
|
|
err = mlxsw_sp_nexthop4_type_init(mlxsw_sp, nh, fib_nh);
|
2017-02-08 18:16:35 +08:00
|
|
|
if (err)
|
|
|
|
goto err_nexthop_neigh_init;
|
|
|
|
|
|
|
|
return 0;
|
|
|
|
|
|
|
|
err_nexthop_neigh_init:
|
|
|
|
mlxsw_sp_nexthop_remove(mlxsw_sp, nh);
|
|
|
|
return err;
|
|
|
|
}
|
|
|
|
|
2017-07-18 16:10:27 +08:00
|
|
|
static void mlxsw_sp_nexthop4_fini(struct mlxsw_sp *mlxsw_sp,
|
|
|
|
struct mlxsw_sp_nexthop *nh)
|
2017-02-08 18:16:35 +08:00
|
|
|
{
|
mlxsw: spectrum_router: Make nexthops typed
In the router, some next hops may reference an encapsulating netdevice,
such as GRE or IPIP. To properly offload these next hops, mlxsw needs to
keep track of whether a given next hop is a regular Ethernet entry, or
an IP-in-IP tunneling entry.
To facilitate this book-keeping, add a type field to struct
mlxsw_sp_nexthop. There is, as of this patch, only one next hop type:
MLXSW_SP_NEXTHOP_TYPE_ETH. Follow-up patches will introduce the IP-in-IP
variant.
There are several places where next hops are initialized in the IPv4
path. Instead of replicating the logic at every one of them, factor it
out to a function mlxsw_sp_nexthop4_type_init(). The corresponding fini
is actually protocol-neutral, so put it to mlxsw_sp_nexthop_type_fini(),
but create a corresponding protocoled _fini function that dispatches to
the protocol-neutral one.
The IPv6 path is simpler, but for symmetry with IPv4, create the same
suite of functions with corresponding logic.
Signed-off-by: Petr Machata <petrm@mellanox.com>
Reviewed-by: Ido Schimmel <idosch@mellanox.com>
Signed-off-by: Jiri Pirko <jiri@mellanox.com>
Signed-off-by: David S. Miller <davem@davemloft.net>
2017-09-03 05:49:22 +08:00
|
|
|
mlxsw_sp_nexthop4_type_fini(mlxsw_sp, nh);
|
2017-09-25 16:32:23 +08:00
|
|
|
list_del(&nh->router_list_node);
|
2017-09-25 16:32:28 +08:00
|
|
|
mlxsw_sp_nexthop_counter_free(mlxsw_sp, nh);
|
2017-02-08 18:16:30 +08:00
|
|
|
mlxsw_sp_nexthop_remove(mlxsw_sp, nh);
|
2016-07-05 17:27:50 +08:00
|
|
|
}
|
|
|
|
|
2017-07-18 16:10:27 +08:00
|
|
|
static void mlxsw_sp_nexthop4_event(struct mlxsw_sp *mlxsw_sp,
|
|
|
|
unsigned long event, struct fib_nh *fib_nh)
|
mlxsw: spectrum_router: Reflect nexthop status changes
When a packet hits a multipath route in the device's routing table, a
hash is computed over its headers, which is then used to select the
appropriate nexthop from the device's adjacency table.
There are situations in which the kernel removes a nexthop from a
multipath route (e.g., no carrier) and the device should do the same.
Upon the reception of NH_{ADD,DEL} events, add or remove a nexthop from
the device's adjacency table and refresh all the routes using the
nexthop group. If all the nexthops of a multipath route are invalid,
then any packet hitting the route would be trapped to the CPU for
forwarding.
If all the nexthops are DEAD, then the kernel would remove the route
entirely. On the other hand, if all the nexthops are merely LINKDOWN,
then the kernel would keep the route and forward any incoming packet
using a different route.
While the last case might sound like a problem, it's expected that a
routing daemon running in user space would remove such a route from the
FIB as it's dumped with the DEAD flag set.
Signed-off-by: Ido Schimmel <idosch@mellanox.com>
Signed-off-by: Jiri Pirko <jiri@mellanox.com>
Signed-off-by: David S. Miller <davem@davemloft.net>
2017-02-08 18:16:40 +08:00
|
|
|
{
|
|
|
|
struct mlxsw_sp_nexthop_key key;
|
|
|
|
struct mlxsw_sp_nexthop *nh;
|
|
|
|
|
2017-05-17 01:38:25 +08:00
|
|
|
if (mlxsw_sp->router->aborted)
|
mlxsw: spectrum_router: Reflect nexthop status changes
When a packet hits a multipath route in the device's routing table, a
hash is computed over its headers, which is then used to select the
appropriate nexthop from the device's adjacency table.
There are situations in which the kernel removes a nexthop from a
multipath route (e.g., no carrier) and the device should do the same.
Upon the reception of NH_{ADD,DEL} events, add or remove a nexthop from
the device's adjacency table and refresh all the routes using the
nexthop group. If all the nexthops of a multipath route are invalid,
then any packet hitting the route would be trapped to the CPU for
forwarding.
If all the nexthops are DEAD, then the kernel would remove the route
entirely. On the other hand, if all the nexthops are merely LINKDOWN,
then the kernel would keep the route and forward any incoming packet
using a different route.
While the last case might sound like a problem, it's expected that a
routing daemon running in user space would remove such a route from the
FIB as it's dumped with the DEAD flag set.
Signed-off-by: Ido Schimmel <idosch@mellanox.com>
Signed-off-by: Jiri Pirko <jiri@mellanox.com>
Signed-off-by: David S. Miller <davem@davemloft.net>
2017-02-08 18:16:40 +08:00
|
|
|
return;
|
|
|
|
|
|
|
|
key.fib_nh = fib_nh;
|
|
|
|
nh = mlxsw_sp_nexthop_lookup(mlxsw_sp, key);
|
2019-12-14 23:53:14 +08:00
|
|
|
if (!nh)
|
mlxsw: spectrum_router: Reflect nexthop status changes
When a packet hits a multipath route in the device's routing table, a
hash is computed over its headers, which is then used to select the
appropriate nexthop from the device's adjacency table.
There are situations in which the kernel removes a nexthop from a
multipath route (e.g., no carrier) and the device should do the same.
Upon the reception of NH_{ADD,DEL} events, add or remove a nexthop from
the device's adjacency table and refresh all the routes using the
nexthop group. If all the nexthops of a multipath route are invalid,
then any packet hitting the route would be trapped to the CPU for
forwarding.
If all the nexthops are DEAD, then the kernel would remove the route
entirely. On the other hand, if all the nexthops are merely LINKDOWN,
then the kernel would keep the route and forward any incoming packet
using a different route.
While the last case might sound like a problem, it's expected that a
routing daemon running in user space would remove such a route from the
FIB as it's dumped with the DEAD flag set.
Signed-off-by: Ido Schimmel <idosch@mellanox.com>
Signed-off-by: Jiri Pirko <jiri@mellanox.com>
Signed-off-by: David S. Miller <davem@davemloft.net>
2017-02-08 18:16:40 +08:00
|
|
|
return;
|
|
|
|
|
|
|
|
switch (event) {
|
|
|
|
case FIB_EVENT_NH_ADD:
|
mlxsw: spectrum_router: Make nexthops typed
In the router, some next hops may reference an encapsulating netdevice,
such as GRE or IPIP. To properly offload these next hops, mlxsw needs to
keep track of whether a given next hop is a regular Ethernet entry, or
an IP-in-IP tunneling entry.
To facilitate this book-keeping, add a type field to struct
mlxsw_sp_nexthop. There is, as of this patch, only one next hop type:
MLXSW_SP_NEXTHOP_TYPE_ETH. Follow-up patches will introduce the IP-in-IP
variant.
There are several places where next hops are initialized in the IPv4
path. Instead of replicating the logic at every one of them, factor it
out to a function mlxsw_sp_nexthop4_type_init(). The corresponding fini
is actually protocol-neutral, so put it to mlxsw_sp_nexthop_type_fini(),
but create a corresponding protocoled _fini function that dispatches to
the protocol-neutral one.
The IPv6 path is simpler, but for symmetry with IPv4, create the same
suite of functions with corresponding logic.
Signed-off-by: Petr Machata <petrm@mellanox.com>
Reviewed-by: Ido Schimmel <idosch@mellanox.com>
Signed-off-by: Jiri Pirko <jiri@mellanox.com>
Signed-off-by: David S. Miller <davem@davemloft.net>
2017-09-03 05:49:22 +08:00
|
|
|
mlxsw_sp_nexthop4_type_init(mlxsw_sp, nh, fib_nh);
|
mlxsw: spectrum_router: Reflect nexthop status changes
When a packet hits a multipath route in the device's routing table, a
hash is computed over its headers, which is then used to select the
appropriate nexthop from the device's adjacency table.
There are situations in which the kernel removes a nexthop from a
multipath route (e.g., no carrier) and the device should do the same.
Upon the reception of NH_{ADD,DEL} events, add or remove a nexthop from
the device's adjacency table and refresh all the routes using the
nexthop group. If all the nexthops of a multipath route are invalid,
then any packet hitting the route would be trapped to the CPU for
forwarding.
If all the nexthops are DEAD, then the kernel would remove the route
entirely. On the other hand, if all the nexthops are merely LINKDOWN,
then the kernel would keep the route and forward any incoming packet
using a different route.
While the last case might sound like a problem, it's expected that a
routing daemon running in user space would remove such a route from the
FIB as it's dumped with the DEAD flag set.
Signed-off-by: Ido Schimmel <idosch@mellanox.com>
Signed-off-by: Jiri Pirko <jiri@mellanox.com>
Signed-off-by: David S. Miller <davem@davemloft.net>
2017-02-08 18:16:40 +08:00
|
|
|
break;
|
|
|
|
case FIB_EVENT_NH_DEL:
|
mlxsw: spectrum_router: Make nexthops typed
In the router, some next hops may reference an encapsulating netdevice,
such as GRE or IPIP. To properly offload these next hops, mlxsw needs to
keep track of whether a given next hop is a regular Ethernet entry, or
an IP-in-IP tunneling entry.
To facilitate this book-keeping, add a type field to struct
mlxsw_sp_nexthop. There is, as of this patch, only one next hop type:
MLXSW_SP_NEXTHOP_TYPE_ETH. Follow-up patches will introduce the IP-in-IP
variant.
There are several places where next hops are initialized in the IPv4
path. Instead of replicating the logic at every one of them, factor it
out to a function mlxsw_sp_nexthop4_type_init(). The corresponding fini
is actually protocol-neutral, so put it to mlxsw_sp_nexthop_type_fini(),
but create a corresponding protocoled _fini function that dispatches to
the protocol-neutral one.
The IPv6 path is simpler, but for symmetry with IPv4, create the same
suite of functions with corresponding logic.
Signed-off-by: Petr Machata <petrm@mellanox.com>
Reviewed-by: Ido Schimmel <idosch@mellanox.com>
Signed-off-by: Jiri Pirko <jiri@mellanox.com>
Signed-off-by: David S. Miller <davem@davemloft.net>
2017-09-03 05:49:22 +08:00
|
|
|
mlxsw_sp_nexthop4_type_fini(mlxsw_sp, nh);
|
mlxsw: spectrum_router: Reflect nexthop status changes
When a packet hits a multipath route in the device's routing table, a
hash is computed over its headers, which is then used to select the
appropriate nexthop from the device's adjacency table.
There are situations in which the kernel removes a nexthop from a
multipath route (e.g., no carrier) and the device should do the same.
Upon the reception of NH_{ADD,DEL} events, add or remove a nexthop from
the device's adjacency table and refresh all the routes using the
nexthop group. If all the nexthops of a multipath route are invalid,
then any packet hitting the route would be trapped to the CPU for
forwarding.
If all the nexthops are DEAD, then the kernel would remove the route
entirely. On the other hand, if all the nexthops are merely LINKDOWN,
then the kernel would keep the route and forward any incoming packet
using a different route.
While the last case might sound like a problem, it's expected that a
routing daemon running in user space would remove such a route from the
FIB as it's dumped with the DEAD flag set.
Signed-off-by: Ido Schimmel <idosch@mellanox.com>
Signed-off-by: Jiri Pirko <jiri@mellanox.com>
Signed-off-by: David S. Miller <davem@davemloft.net>
2017-02-08 18:16:40 +08:00
|
|
|
break;
|
|
|
|
}
|
|
|
|
|
|
|
|
mlxsw_sp_nexthop_group_refresh(mlxsw_sp, nh->nh_grp);
|
|
|
|
}
|
|
|
|
|
2017-11-03 17:03:38 +08:00
|
|
|
static void mlxsw_sp_nexthop_rif_update(struct mlxsw_sp *mlxsw_sp,
|
|
|
|
struct mlxsw_sp_rif *rif)
|
|
|
|
{
|
|
|
|
struct mlxsw_sp_nexthop *nh;
|
2017-11-03 17:03:44 +08:00
|
|
|
bool removing;
|
2017-11-03 17:03:38 +08:00
|
|
|
|
|
|
|
list_for_each_entry(nh, &rif->nexthop_list, rif_list_node) {
|
2017-11-03 17:03:44 +08:00
|
|
|
switch (nh->type) {
|
|
|
|
case MLXSW_SP_NEXTHOP_TYPE_ETH:
|
|
|
|
removing = false;
|
|
|
|
break;
|
|
|
|
case MLXSW_SP_NEXTHOP_TYPE_IPIP:
|
|
|
|
removing = !mlxsw_sp_ipip_netdev_ul_up(rif->dev);
|
|
|
|
break;
|
|
|
|
default:
|
|
|
|
WARN_ON(1);
|
|
|
|
continue;
|
|
|
|
}
|
|
|
|
|
|
|
|
__mlxsw_sp_nexthop_neigh_update(nh, removing);
|
2017-11-03 17:03:38 +08:00
|
|
|
mlxsw_sp_nexthop_group_refresh(mlxsw_sp, nh->nh_grp);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2017-11-28 20:17:14 +08:00
|
|
|
static void mlxsw_sp_nexthop_rif_migrate(struct mlxsw_sp *mlxsw_sp,
|
|
|
|
struct mlxsw_sp_rif *old_rif,
|
|
|
|
struct mlxsw_sp_rif *new_rif)
|
|
|
|
{
|
|
|
|
struct mlxsw_sp_nexthop *nh;
|
|
|
|
|
|
|
|
list_splice_init(&old_rif->nexthop_list, &new_rif->nexthop_list);
|
|
|
|
list_for_each_entry(nh, &new_rif->nexthop_list, rif_list_node)
|
|
|
|
nh->rif = new_rif;
|
|
|
|
mlxsw_sp_nexthop_rif_update(mlxsw_sp, new_rif);
|
|
|
|
}
|
|
|
|
|
2017-02-08 18:16:42 +08:00
|
|
|
static void mlxsw_sp_nexthop_rif_gone_sync(struct mlxsw_sp *mlxsw_sp,
|
2017-03-17 16:38:00 +08:00
|
|
|
struct mlxsw_sp_rif *rif)
|
2017-02-08 18:16:42 +08:00
|
|
|
{
|
|
|
|
struct mlxsw_sp_nexthop *nh, *tmp;
|
|
|
|
|
2017-03-17 16:38:00 +08:00
|
|
|
list_for_each_entry_safe(nh, tmp, &rif->nexthop_list, rif_list_node) {
|
mlxsw: spectrum_router: Make nexthops typed
In the router, some next hops may reference an encapsulating netdevice,
such as GRE or IPIP. To properly offload these next hops, mlxsw needs to
keep track of whether a given next hop is a regular Ethernet entry, or
an IP-in-IP tunneling entry.
To facilitate this book-keeping, add a type field to struct
mlxsw_sp_nexthop. There is, as of this patch, only one next hop type:
MLXSW_SP_NEXTHOP_TYPE_ETH. Follow-up patches will introduce the IP-in-IP
variant.
There are several places where next hops are initialized in the IPv4
path. Instead of replicating the logic at every one of them, factor it
out to a function mlxsw_sp_nexthop4_type_init(). The corresponding fini
is actually protocol-neutral, so put it to mlxsw_sp_nexthop_type_fini(),
but create a corresponding protocoled _fini function that dispatches to
the protocol-neutral one.
The IPv6 path is simpler, but for symmetry with IPv4, create the same
suite of functions with corresponding logic.
Signed-off-by: Petr Machata <petrm@mellanox.com>
Reviewed-by: Ido Schimmel <idosch@mellanox.com>
Signed-off-by: Jiri Pirko <jiri@mellanox.com>
Signed-off-by: David S. Miller <davem@davemloft.net>
2017-09-03 05:49:22 +08:00
|
|
|
mlxsw_sp_nexthop_type_fini(mlxsw_sp, nh);
|
2017-02-08 18:16:42 +08:00
|
|
|
mlxsw_sp_nexthop_group_refresh(mlxsw_sp, nh->nh_grp);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2017-09-03 05:49:20 +08:00
|
|
|
static bool mlxsw_sp_fi_is_gateway(const struct mlxsw_sp *mlxsw_sp,
|
2019-06-04 11:19:49 +08:00
|
|
|
struct fib_info *fi)
|
2017-09-03 05:49:20 +08:00
|
|
|
{
|
2019-06-04 11:19:49 +08:00
|
|
|
const struct fib_nh *nh = fib_info_nh(fi, 0);
|
|
|
|
|
|
|
|
return nh->fib_nh_scope == RT_SCOPE_LINK ||
|
|
|
|
mlxsw_sp_nexthop4_ipip_type(mlxsw_sp, nh, NULL);
|
2017-09-03 05:49:20 +08:00
|
|
|
}
|
|
|
|
|
2016-07-05 17:27:50 +08:00
|
|
|
static struct mlxsw_sp_nexthop_group *
|
2017-07-18 16:10:27 +08:00
|
|
|
mlxsw_sp_nexthop4_group_create(struct mlxsw_sp *mlxsw_sp, struct fib_info *fi)
|
2016-07-05 17:27:50 +08:00
|
|
|
{
|
2019-06-04 11:19:49 +08:00
|
|
|
unsigned int nhs = fib_info_num_path(fi);
|
2016-07-05 17:27:50 +08:00
|
|
|
struct mlxsw_sp_nexthop_group *nh_grp;
|
|
|
|
struct mlxsw_sp_nexthop *nh;
|
|
|
|
struct fib_nh *fib_nh;
|
|
|
|
int i;
|
|
|
|
int err;
|
|
|
|
|
2019-06-04 11:19:49 +08:00
|
|
|
nh_grp = kzalloc(struct_size(nh_grp, nexthops, nhs), GFP_KERNEL);
|
2016-07-05 17:27:50 +08:00
|
|
|
if (!nh_grp)
|
|
|
|
return ERR_PTR(-ENOMEM);
|
2017-08-15 03:09:19 +08:00
|
|
|
nh_grp->priv = fi;
|
2016-07-05 17:27:50 +08:00
|
|
|
INIT_LIST_HEAD(&nh_grp->fib_list);
|
2017-07-18 16:10:19 +08:00
|
|
|
nh_grp->neigh_tbl = &arp_tbl;
|
|
|
|
|
2017-09-03 05:49:20 +08:00
|
|
|
nh_grp->gateway = mlxsw_sp_fi_is_gateway(mlxsw_sp, fi);
|
2019-06-04 11:19:49 +08:00
|
|
|
nh_grp->count = nhs;
|
2017-07-12 15:12:53 +08:00
|
|
|
fib_info_hold(fi);
|
2016-07-05 17:27:50 +08:00
|
|
|
for (i = 0; i < nh_grp->count; i++) {
|
|
|
|
nh = &nh_grp->nexthops[i];
|
2019-06-04 11:19:49 +08:00
|
|
|
fib_nh = fib_info_nh(fi, i);
|
2017-07-18 16:10:27 +08:00
|
|
|
err = mlxsw_sp_nexthop4_init(mlxsw_sp, nh_grp, nh, fib_nh);
|
2016-07-05 17:27:50 +08:00
|
|
|
if (err)
|
2017-07-18 16:10:27 +08:00
|
|
|
goto err_nexthop4_init;
|
2016-07-05 17:27:50 +08:00
|
|
|
}
|
2017-02-08 18:16:29 +08:00
|
|
|
err = mlxsw_sp_nexthop_group_insert(mlxsw_sp, nh_grp);
|
|
|
|
if (err)
|
|
|
|
goto err_nexthop_group_insert;
|
2016-07-05 17:27:50 +08:00
|
|
|
mlxsw_sp_nexthop_group_refresh(mlxsw_sp, nh_grp);
|
|
|
|
return nh_grp;
|
|
|
|
|
2017-02-08 18:16:29 +08:00
|
|
|
err_nexthop_group_insert:
|
2017-07-18 16:10:27 +08:00
|
|
|
err_nexthop4_init:
|
2017-02-08 21:36:49 +08:00
|
|
|
for (i--; i >= 0; i--) {
|
|
|
|
nh = &nh_grp->nexthops[i];
|
2017-07-18 16:10:27 +08:00
|
|
|
mlxsw_sp_nexthop4_fini(mlxsw_sp, nh);
|
2017-02-08 21:36:49 +08:00
|
|
|
}
|
2017-08-15 03:09:19 +08:00
|
|
|
fib_info_put(fi);
|
2016-07-05 17:27:50 +08:00
|
|
|
kfree(nh_grp);
|
|
|
|
return ERR_PTR(err);
|
|
|
|
}
|
|
|
|
|
|
|
|
static void
|
2017-07-18 16:10:27 +08:00
|
|
|
mlxsw_sp_nexthop4_group_destroy(struct mlxsw_sp *mlxsw_sp,
|
|
|
|
struct mlxsw_sp_nexthop_group *nh_grp)
|
2016-07-05 17:27:50 +08:00
|
|
|
{
|
|
|
|
struct mlxsw_sp_nexthop *nh;
|
|
|
|
int i;
|
|
|
|
|
2017-02-08 18:16:29 +08:00
|
|
|
mlxsw_sp_nexthop_group_remove(mlxsw_sp, nh_grp);
|
2016-07-05 17:27:50 +08:00
|
|
|
for (i = 0; i < nh_grp->count; i++) {
|
|
|
|
nh = &nh_grp->nexthops[i];
|
2017-07-18 16:10:27 +08:00
|
|
|
mlxsw_sp_nexthop4_fini(mlxsw_sp, nh);
|
2016-07-05 17:27:50 +08:00
|
|
|
}
|
2016-12-23 16:32:50 +08:00
|
|
|
mlxsw_sp_nexthop_group_refresh(mlxsw_sp, nh_grp);
|
|
|
|
WARN_ON_ONCE(nh_grp->adj_index_valid);
|
2017-08-15 03:09:19 +08:00
|
|
|
fib_info_put(mlxsw_sp_nexthop4_group_fi(nh_grp));
|
2016-07-05 17:27:50 +08:00
|
|
|
kfree(nh_grp);
|
|
|
|
}
|
|
|
|
|
2017-07-18 16:10:27 +08:00
|
|
|
static int mlxsw_sp_nexthop4_group_get(struct mlxsw_sp *mlxsw_sp,
|
|
|
|
struct mlxsw_sp_fib_entry *fib_entry,
|
|
|
|
struct fib_info *fi)
|
2016-07-05 17:27:50 +08:00
|
|
|
{
|
|
|
|
struct mlxsw_sp_nexthop_group *nh_grp;
|
|
|
|
|
2017-08-15 03:09:19 +08:00
|
|
|
nh_grp = mlxsw_sp_nexthop4_group_lookup(mlxsw_sp, fi);
|
2016-07-05 17:27:50 +08:00
|
|
|
if (!nh_grp) {
|
2017-07-18 16:10:27 +08:00
|
|
|
nh_grp = mlxsw_sp_nexthop4_group_create(mlxsw_sp, fi);
|
2016-07-05 17:27:50 +08:00
|
|
|
if (IS_ERR(nh_grp))
|
|
|
|
return PTR_ERR(nh_grp);
|
|
|
|
}
|
|
|
|
list_add_tail(&fib_entry->nexthop_group_node, &nh_grp->fib_list);
|
|
|
|
fib_entry->nh_group = nh_grp;
|
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
2017-07-18 16:10:27 +08:00
|
|
|
static void mlxsw_sp_nexthop4_group_put(struct mlxsw_sp *mlxsw_sp,
|
|
|
|
struct mlxsw_sp_fib_entry *fib_entry)
|
2016-07-05 17:27:50 +08:00
|
|
|
{
|
|
|
|
struct mlxsw_sp_nexthop_group *nh_grp = fib_entry->nh_group;
|
|
|
|
|
|
|
|
list_del(&fib_entry->nexthop_group_node);
|
|
|
|
if (!list_empty(&nh_grp->fib_list))
|
|
|
|
return;
|
2017-07-18 16:10:27 +08:00
|
|
|
mlxsw_sp_nexthop4_group_destroy(mlxsw_sp, nh_grp);
|
2016-07-05 17:27:50 +08:00
|
|
|
}
|
|
|
|
|
2017-07-18 16:10:26 +08:00
|
|
|
static bool
|
|
|
|
mlxsw_sp_fib4_entry_should_offload(const struct mlxsw_sp_fib_entry *fib_entry)
|
|
|
|
{
|
|
|
|
struct mlxsw_sp_fib4_entry *fib4_entry;
|
|
|
|
|
|
|
|
fib4_entry = container_of(fib_entry, struct mlxsw_sp_fib4_entry,
|
|
|
|
common);
|
|
|
|
return !fib4_entry->tos;
|
|
|
|
}
|
|
|
|
|
2017-02-08 18:16:36 +08:00
|
|
|
static bool
|
|
|
|
mlxsw_sp_fib_entry_should_offload(const struct mlxsw_sp_fib_entry *fib_entry)
|
|
|
|
{
|
|
|
|
struct mlxsw_sp_nexthop_group *nh_group = fib_entry->nh_group;
|
|
|
|
|
2017-07-18 16:10:26 +08:00
|
|
|
switch (fib_entry->fib_node->fib->proto) {
|
|
|
|
case MLXSW_SP_L3_PROTO_IPV4:
|
|
|
|
if (!mlxsw_sp_fib4_entry_should_offload(fib_entry))
|
|
|
|
return false;
|
|
|
|
break;
|
|
|
|
case MLXSW_SP_L3_PROTO_IPV6:
|
|
|
|
break;
|
|
|
|
}
|
mlxsw: spectrum_router: Correctly handle identical routes
In the device, routes are indexed in a routing table based on the prefix
and its length. This is in contrast to the kernel's FIB where several
FIB aliases can exist with these parameters being identical. In such
cases, the routes will be sorted by table ID (LOCAL first, then MAIN),
TOS and finally priority (metric).
During lookup, these routes will be evaluated in order. In case the
packet's TOS field is non-zero and a FIB alias with a matching TOS is
found, then it's selected. Otherwise, the lookup defaults to the route
with TOS 0 (if it exists). However, if the requested scope is narrower
than the one found, then the lookup continues.
To best reflect the kernel's datapath we should take the above into
account. Given a prefix and its length, the reflected route will always
be the first one in the FIB alias list. However, if the route has a
non-zero TOS then its action will be converted to trap instead of
forward, since we currently don't support TOS-based routing. If this
turns out to be a real issue, we can add support for that using
policy-based switching.
The route's scope can be effectively ignored as any packet being routed
by the device would've been looked-up using the widest scope (UNIVERSE).
To achieve that we need to do two changes. Firstly, we need to create
another struct (FIB node) that will hold the list of FIB entries sharing
the same prefix and length. This struct will be hashed using these two
parameters.
Secondly, we need to change the route reflection to match the above
logic, so that the first FIB entry in the list will be programmed into
the device while the rest will remain in the driver's cache in case of
subsequent changes.
Signed-off-by: Ido Schimmel <idosch@mellanox.com>
Signed-off-by: Jiri Pirko <jiri@mellanox.com>
Signed-off-by: David S. Miller <davem@davemloft.net>
2017-02-09 17:28:42 +08:00
|
|
|
|
2017-02-08 18:16:36 +08:00
|
|
|
switch (fib_entry->type) {
|
|
|
|
case MLXSW_SP_FIB_ENTRY_TYPE_REMOTE:
|
|
|
|
return !!nh_group->adj_index_valid;
|
|
|
|
case MLXSW_SP_FIB_ENTRY_TYPE_LOCAL:
|
2017-02-08 18:16:38 +08:00
|
|
|
return !!nh_group->nh_rif;
|
2019-02-07 03:42:01 +08:00
|
|
|
case MLXSW_SP_FIB_ENTRY_TYPE_BLACKHOLE:
|
2017-09-03 05:49:25 +08:00
|
|
|
case MLXSW_SP_FIB_ENTRY_TYPE_IPIP_DECAP:
|
2018-10-17 16:53:07 +08:00
|
|
|
case MLXSW_SP_FIB_ENTRY_TYPE_NVE_DECAP:
|
2017-09-03 05:49:25 +08:00
|
|
|
return true;
|
2017-02-08 18:16:36 +08:00
|
|
|
default:
|
|
|
|
return false;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2017-08-03 19:28:28 +08:00
|
|
|
static struct mlxsw_sp_nexthop *
|
|
|
|
mlxsw_sp_rt6_nexthop(struct mlxsw_sp_nexthop_group *nh_grp,
|
|
|
|
const struct mlxsw_sp_rt6 *mlxsw_sp_rt6)
|
|
|
|
{
|
|
|
|
int i;
|
|
|
|
|
|
|
|
for (i = 0; i < nh_grp->count; i++) {
|
|
|
|
struct mlxsw_sp_nexthop *nh = &nh_grp->nexthops[i];
|
2018-04-18 08:33:26 +08:00
|
|
|
struct fib6_info *rt = mlxsw_sp_rt6->rt;
|
2017-08-03 19:28:28 +08:00
|
|
|
|
2019-05-23 11:27:59 +08:00
|
|
|
if (nh->rif && nh->rif->dev == rt->fib6_nh->fib_nh_dev &&
|
2017-08-03 19:28:28 +08:00
|
|
|
ipv6_addr_equal((const struct in6_addr *) &nh->gw_addr,
|
2019-05-23 11:27:59 +08:00
|
|
|
&rt->fib6_nh->fib_nh_gw6))
|
2017-08-03 19:28:28 +08:00
|
|
|
return nh;
|
|
|
|
continue;
|
|
|
|
}
|
|
|
|
|
|
|
|
return NULL;
|
|
|
|
}
|
|
|
|
|
2017-08-02 15:56:03 +08:00
|
|
|
static void
|
2020-01-14 19:23:14 +08:00
|
|
|
mlxsw_sp_fib4_entry_hw_flags_set(struct mlxsw_sp *mlxsw_sp,
|
|
|
|
struct mlxsw_sp_fib_entry *fib_entry)
|
2017-08-02 15:56:03 +08:00
|
|
|
{
|
2020-01-14 19:23:14 +08:00
|
|
|
struct fib_info *fi = mlxsw_sp_nexthop4_group_fi(fib_entry->nh_group);
|
|
|
|
u32 *p_dst = (u32 *) fib_entry->fib_node->key.addr;
|
|
|
|
int dst_len = fib_entry->fib_node->key.prefix_len;
|
|
|
|
struct mlxsw_sp_fib4_entry *fib4_entry;
|
|
|
|
struct fib_rt_info fri;
|
|
|
|
bool should_offload;
|
2017-08-02 15:56:03 +08:00
|
|
|
|
2020-01-14 19:23:14 +08:00
|
|
|
should_offload = mlxsw_sp_fib_entry_should_offload(fib_entry);
|
|
|
|
fib4_entry = container_of(fib_entry, struct mlxsw_sp_fib4_entry,
|
|
|
|
common);
|
|
|
|
fri.fi = fi;
|
|
|
|
fri.tb_id = fib4_entry->tb_id;
|
|
|
|
fri.dst = cpu_to_be32(*p_dst);
|
|
|
|
fri.dst_len = dst_len;
|
|
|
|
fri.tos = fib4_entry->tos;
|
|
|
|
fri.type = fib4_entry->type;
|
|
|
|
fri.offload = should_offload;
|
|
|
|
fri.trap = !should_offload;
|
|
|
|
fib_alias_hw_flags_set(mlxsw_sp_net(mlxsw_sp), &fri);
|
2017-08-02 15:56:03 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
static void
|
2020-01-14 19:23:14 +08:00
|
|
|
mlxsw_sp_fib4_entry_hw_flags_clear(struct mlxsw_sp *mlxsw_sp,
|
|
|
|
struct mlxsw_sp_fib_entry *fib_entry)
|
2017-08-02 15:56:03 +08:00
|
|
|
{
|
2020-01-14 19:23:14 +08:00
|
|
|
struct fib_info *fi = mlxsw_sp_nexthop4_group_fi(fib_entry->nh_group);
|
|
|
|
u32 *p_dst = (u32 *) fib_entry->fib_node->key.addr;
|
|
|
|
int dst_len = fib_entry->fib_node->key.prefix_len;
|
|
|
|
struct mlxsw_sp_fib4_entry *fib4_entry;
|
|
|
|
struct fib_rt_info fri;
|
2017-08-02 15:56:03 +08:00
|
|
|
|
2020-01-14 19:23:14 +08:00
|
|
|
fib4_entry = container_of(fib_entry, struct mlxsw_sp_fib4_entry,
|
|
|
|
common);
|
|
|
|
fri.fi = fi;
|
|
|
|
fri.tb_id = fib4_entry->tb_id;
|
|
|
|
fri.dst = cpu_to_be32(*p_dst);
|
|
|
|
fri.dst_len = dst_len;
|
|
|
|
fri.tos = fib4_entry->tos;
|
|
|
|
fri.type = fib4_entry->type;
|
|
|
|
fri.offload = false;
|
|
|
|
fri.trap = false;
|
|
|
|
fib_alias_hw_flags_set(mlxsw_sp_net(mlxsw_sp), &fri);
|
2017-08-02 15:56:03 +08:00
|
|
|
}
|
|
|
|
|
2017-08-03 19:28:28 +08:00
|
|
|
static void
|
2020-01-14 19:23:14 +08:00
|
|
|
mlxsw_sp_fib6_entry_hw_flags_set(struct mlxsw_sp *mlxsw_sp,
|
|
|
|
struct mlxsw_sp_fib_entry *fib_entry)
|
2017-08-03 19:28:28 +08:00
|
|
|
{
|
|
|
|
struct mlxsw_sp_fib6_entry *fib6_entry;
|
|
|
|
struct mlxsw_sp_rt6 *mlxsw_sp_rt6;
|
2020-01-14 19:23:14 +08:00
|
|
|
bool should_offload;
|
|
|
|
|
|
|
|
should_offload = mlxsw_sp_fib_entry_should_offload(fib_entry);
|
2017-08-03 19:28:28 +08:00
|
|
|
|
2020-01-14 19:23:14 +08:00
|
|
|
/* In IPv6 a multipath route is represented using multiple routes, so
|
|
|
|
* we need to set the flags on all of them.
|
|
|
|
*/
|
2017-08-03 19:28:28 +08:00
|
|
|
fib6_entry = container_of(fib_entry, struct mlxsw_sp_fib6_entry,
|
|
|
|
common);
|
2020-01-14 19:23:14 +08:00
|
|
|
list_for_each_entry(mlxsw_sp_rt6, &fib6_entry->rt6_list, list)
|
|
|
|
fib6_info_hw_flags_set(mlxsw_sp_rt6->rt, should_offload,
|
|
|
|
!should_offload);
|
2017-08-03 19:28:28 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
static void
|
2020-01-14 19:23:14 +08:00
|
|
|
mlxsw_sp_fib6_entry_hw_flags_clear(struct mlxsw_sp *mlxsw_sp,
|
|
|
|
struct mlxsw_sp_fib_entry *fib_entry)
|
2017-08-03 19:28:28 +08:00
|
|
|
{
|
|
|
|
struct mlxsw_sp_fib6_entry *fib6_entry;
|
|
|
|
struct mlxsw_sp_rt6 *mlxsw_sp_rt6;
|
|
|
|
|
|
|
|
fib6_entry = container_of(fib_entry, struct mlxsw_sp_fib6_entry,
|
|
|
|
common);
|
2020-01-14 19:23:14 +08:00
|
|
|
list_for_each_entry(mlxsw_sp_rt6, &fib6_entry->rt6_list, list)
|
|
|
|
fib6_info_hw_flags_set(mlxsw_sp_rt6->rt, false, false);
|
2017-08-03 19:28:28 +08:00
|
|
|
}
|
|
|
|
|
2020-01-14 19:23:14 +08:00
|
|
|
static void
|
|
|
|
mlxsw_sp_fib_entry_hw_flags_set(struct mlxsw_sp *mlxsw_sp,
|
|
|
|
struct mlxsw_sp_fib_entry *fib_entry)
|
2017-02-08 18:16:36 +08:00
|
|
|
{
|
2017-03-10 15:53:41 +08:00
|
|
|
switch (fib_entry->fib_node->fib->proto) {
|
2017-02-08 18:16:36 +08:00
|
|
|
case MLXSW_SP_L3_PROTO_IPV4:
|
2020-01-14 19:23:14 +08:00
|
|
|
mlxsw_sp_fib4_entry_hw_flags_set(mlxsw_sp, fib_entry);
|
2017-02-08 18:16:36 +08:00
|
|
|
break;
|
|
|
|
case MLXSW_SP_L3_PROTO_IPV6:
|
2020-01-14 19:23:14 +08:00
|
|
|
mlxsw_sp_fib6_entry_hw_flags_set(mlxsw_sp, fib_entry);
|
2017-08-03 19:28:28 +08:00
|
|
|
break;
|
2017-02-08 18:16:36 +08:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
static void
|
2020-01-14 19:23:14 +08:00
|
|
|
mlxsw_sp_fib_entry_hw_flags_clear(struct mlxsw_sp *mlxsw_sp,
|
|
|
|
struct mlxsw_sp_fib_entry *fib_entry)
|
2017-02-08 18:16:36 +08:00
|
|
|
{
|
2017-03-10 15:53:41 +08:00
|
|
|
switch (fib_entry->fib_node->fib->proto) {
|
2017-02-08 18:16:36 +08:00
|
|
|
case MLXSW_SP_L3_PROTO_IPV4:
|
2020-01-14 19:23:14 +08:00
|
|
|
mlxsw_sp_fib4_entry_hw_flags_clear(mlxsw_sp, fib_entry);
|
2017-02-08 18:16:36 +08:00
|
|
|
break;
|
|
|
|
case MLXSW_SP_L3_PROTO_IPV6:
|
2020-01-14 19:23:14 +08:00
|
|
|
mlxsw_sp_fib6_entry_hw_flags_clear(mlxsw_sp, fib_entry);
|
2017-08-03 19:28:28 +08:00
|
|
|
break;
|
2017-02-08 18:16:36 +08:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
static void
|
2020-01-14 19:23:14 +08:00
|
|
|
mlxsw_sp_fib_entry_hw_flags_refresh(struct mlxsw_sp *mlxsw_sp,
|
|
|
|
struct mlxsw_sp_fib_entry *fib_entry,
|
|
|
|
enum mlxsw_reg_ralue_op op)
|
2017-02-08 18:16:36 +08:00
|
|
|
{
|
|
|
|
switch (op) {
|
|
|
|
case MLXSW_REG_RALUE_OP_WRITE_WRITE:
|
2020-01-14 19:23:14 +08:00
|
|
|
mlxsw_sp_fib_entry_hw_flags_set(mlxsw_sp, fib_entry);
|
|
|
|
break;
|
|
|
|
case MLXSW_REG_RALUE_OP_WRITE_DELETE:
|
|
|
|
mlxsw_sp_fib_entry_hw_flags_clear(mlxsw_sp, fib_entry);
|
|
|
|
break;
|
2017-02-08 18:16:36 +08:00
|
|
|
default:
|
2020-01-14 19:23:14 +08:00
|
|
|
break;
|
2017-02-08 18:16:36 +08:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2017-07-18 16:10:24 +08:00
|
|
|
static void
|
|
|
|
mlxsw_sp_fib_entry_ralue_pack(char *ralue_pl,
|
|
|
|
const struct mlxsw_sp_fib_entry *fib_entry,
|
|
|
|
enum mlxsw_reg_ralue_op op)
|
2016-07-05 17:27:50 +08:00
|
|
|
{
|
2017-03-10 15:53:41 +08:00
|
|
|
struct mlxsw_sp_fib *fib = fib_entry->fib_node->fib;
|
2017-07-18 16:10:24 +08:00
|
|
|
enum mlxsw_reg_ralxx_protocol proto;
|
|
|
|
u32 *p_dip;
|
|
|
|
|
|
|
|
proto = (enum mlxsw_reg_ralxx_protocol) fib->proto;
|
|
|
|
|
|
|
|
switch (fib->proto) {
|
|
|
|
case MLXSW_SP_L3_PROTO_IPV4:
|
|
|
|
p_dip = (u32 *) fib_entry->fib_node->key.addr;
|
|
|
|
mlxsw_reg_ralue_pack4(ralue_pl, proto, op, fib->vr->id,
|
|
|
|
fib_entry->fib_node->key.prefix_len,
|
|
|
|
*p_dip);
|
|
|
|
break;
|
|
|
|
case MLXSW_SP_L3_PROTO_IPV6:
|
|
|
|
mlxsw_reg_ralue_pack6(ralue_pl, proto, op, fib->vr->id,
|
|
|
|
fib_entry->fib_node->key.prefix_len,
|
|
|
|
fib_entry->fib_node->key.addr);
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2019-11-08 00:42:16 +08:00
|
|
|
/* Make sure the router's discard adjacency entry exists.
 *
 * Nothing is done when the entry is already marked valid. Otherwise one
 * adjacency KVDL entry is allocated and an Ethernet RATR entry with a
 * "discard errors" trap action is written for @rif_index. When the register
 * write fails the KVDL entry is released again.
 *
 * Returns 0 on success or a negative error from the allocation or the
 * register write.
 */
static int mlxsw_sp_adj_discard_write(struct mlxsw_sp *mlxsw_sp, u16 rif_index)
{
	struct mlxsw_sp_router *router = mlxsw_sp->router;
	char ratr_pl[MLXSW_REG_RATR_LEN];
	int err;

	if (router->adj_discard_index_valid)
		return 0;

	err = mlxsw_sp_kvdl_alloc(mlxsw_sp, MLXSW_SP_KVDL_ENTRY_TYPE_ADJ, 1,
				  &router->adj_discard_index);
	if (err)
		return err;

	mlxsw_reg_ratr_pack(ratr_pl, MLXSW_REG_RATR_OP_WRITE_WRITE_ENTRY, true,
			    MLXSW_REG_RATR_TYPE_ETHERNET,
			    router->adj_discard_index, rif_index);
	mlxsw_reg_ratr_trap_action_set(ratr_pl,
				       MLXSW_REG_RATR_TRAP_ACTION_DISCARD_ERRORS);

	err = mlxsw_reg_write(mlxsw_sp->core, MLXSW_REG(ratr), ratr_pl);
	if (err) {
		mlxsw_sp_kvdl_free(mlxsw_sp, MLXSW_SP_KVDL_ENTRY_TYPE_ADJ, 1,
				   router->adj_discard_index);
		return err;
	}

	router->adj_discard_index_valid = true;

	return 0;
}
|
|
|
|
|
2017-07-18 16:10:24 +08:00
|
|
|
static int mlxsw_sp_fib_entry_op_remote(struct mlxsw_sp *mlxsw_sp,
|
|
|
|
struct mlxsw_sp_fib_entry *fib_entry,
|
|
|
|
enum mlxsw_reg_ralue_op op)
|
|
|
|
{
|
2019-11-08 00:42:16 +08:00
|
|
|
struct mlxsw_sp_nexthop_group *nh_group = fib_entry->nh_group;
|
2017-07-18 16:10:24 +08:00
|
|
|
char ralue_pl[MLXSW_REG_RALUE_LEN];
|
2016-07-05 17:27:50 +08:00
|
|
|
enum mlxsw_reg_ralue_trap_action trap_action;
|
|
|
|
u16 trap_id = 0;
|
|
|
|
u32 adjacency_index = 0;
|
|
|
|
u16 ecmp_size = 0;
|
2019-11-08 00:42:16 +08:00
|
|
|
int err;
|
2016-07-05 17:27:50 +08:00
|
|
|
|
|
|
|
/* In case the nexthop group adjacency index is valid, use it
|
|
|
|
* with provided ECMP size. Otherwise, setup trap and pass
|
|
|
|
* traffic to kernel.
|
|
|
|
*/
|
2017-02-08 18:16:37 +08:00
|
|
|
if (mlxsw_sp_fib_entry_should_offload(fib_entry)) {
|
2016-07-05 17:27:50 +08:00
|
|
|
trap_action = MLXSW_REG_RALUE_TRAP_ACTION_NOP;
|
|
|
|
adjacency_index = fib_entry->nh_group->adj_index;
|
|
|
|
ecmp_size = fib_entry->nh_group->ecmp_size;
|
2019-11-08 00:42:16 +08:00
|
|
|
} else if (!nh_group->adj_index_valid && nh_group->count &&
|
|
|
|
nh_group->nh_rif) {
|
|
|
|
err = mlxsw_sp_adj_discard_write(mlxsw_sp,
|
|
|
|
nh_group->nh_rif->rif_index);
|
|
|
|
if (err)
|
|
|
|
return err;
|
|
|
|
trap_action = MLXSW_REG_RALUE_TRAP_ACTION_NOP;
|
|
|
|
adjacency_index = mlxsw_sp->router->adj_discard_index;
|
|
|
|
ecmp_size = 1;
|
2016-07-05 17:27:50 +08:00
|
|
|
} else {
|
|
|
|
trap_action = MLXSW_REG_RALUE_TRAP_ACTION_TRAP;
|
|
|
|
trap_id = MLXSW_TRAP_ID_RTR_INGRESS0;
|
|
|
|
}
|
|
|
|
|
2017-07-18 16:10:24 +08:00
|
|
|
mlxsw_sp_fib_entry_ralue_pack(ralue_pl, fib_entry, op);
|
2016-07-05 17:27:50 +08:00
|
|
|
mlxsw_reg_ralue_act_remote_pack(ralue_pl, trap_action, trap_id,
|
|
|
|
adjacency_index, ecmp_size);
|
|
|
|
return mlxsw_reg_write(mlxsw_sp->core, MLXSW_REG(ralue), ralue_pl);
|
|
|
|
}
|
|
|
|
|
2017-07-18 16:10:24 +08:00
|
|
|
static int mlxsw_sp_fib_entry_op_local(struct mlxsw_sp *mlxsw_sp,
|
|
|
|
struct mlxsw_sp_fib_entry *fib_entry,
|
|
|
|
enum mlxsw_reg_ralue_op op)
|
2016-07-04 14:23:11 +08:00
|
|
|
{
|
2017-03-17 16:38:00 +08:00
|
|
|
struct mlxsw_sp_rif *rif = fib_entry->nh_group->nh_rif;
|
2017-02-08 18:16:38 +08:00
|
|
|
enum mlxsw_reg_ralue_trap_action trap_action;
|
2016-07-04 14:23:11 +08:00
|
|
|
char ralue_pl[MLXSW_REG_RALUE_LEN];
|
2017-02-08 18:16:38 +08:00
|
|
|
u16 trap_id = 0;
|
2017-03-17 16:38:00 +08:00
|
|
|
u16 rif_index = 0;
|
2017-02-08 18:16:38 +08:00
|
|
|
|
|
|
|
if (mlxsw_sp_fib_entry_should_offload(fib_entry)) {
|
|
|
|
trap_action = MLXSW_REG_RALUE_TRAP_ACTION_NOP;
|
2017-03-17 16:38:00 +08:00
|
|
|
rif_index = rif->rif_index;
|
2017-02-08 18:16:38 +08:00
|
|
|
} else {
|
|
|
|
trap_action = MLXSW_REG_RALUE_TRAP_ACTION_TRAP;
|
|
|
|
trap_id = MLXSW_TRAP_ID_RTR_INGRESS0;
|
|
|
|
}
|
2016-07-04 14:23:11 +08:00
|
|
|
|
2017-07-18 16:10:24 +08:00
|
|
|
mlxsw_sp_fib_entry_ralue_pack(ralue_pl, fib_entry, op);
|
2017-03-17 16:38:00 +08:00
|
|
|
mlxsw_reg_ralue_act_local_pack(ralue_pl, trap_action, trap_id,
|
|
|
|
rif_index);
|
2016-07-04 14:23:11 +08:00
|
|
|
return mlxsw_reg_write(mlxsw_sp->core, MLXSW_REG(ralue), ralue_pl);
|
|
|
|
}
|
|
|
|
|
2017-07-18 16:10:24 +08:00
|
|
|
static int mlxsw_sp_fib_entry_op_trap(struct mlxsw_sp *mlxsw_sp,
|
|
|
|
struct mlxsw_sp_fib_entry *fib_entry,
|
|
|
|
enum mlxsw_reg_ralue_op op)
|
2016-07-04 14:23:11 +08:00
|
|
|
{
|
|
|
|
char ralue_pl[MLXSW_REG_RALUE_LEN];
|
|
|
|
|
2017-07-18 16:10:24 +08:00
|
|
|
mlxsw_sp_fib_entry_ralue_pack(ralue_pl, fib_entry, op);
|
2016-07-04 14:23:11 +08:00
|
|
|
mlxsw_reg_ralue_act_ip2me_pack(ralue_pl);
|
|
|
|
return mlxsw_reg_write(mlxsw_sp->core, MLXSW_REG(ralue), ralue_pl);
|
|
|
|
}
|
|
|
|
|
2019-02-07 03:42:01 +08:00
|
|
|
static int mlxsw_sp_fib_entry_op_blackhole(struct mlxsw_sp *mlxsw_sp,
|
|
|
|
struct mlxsw_sp_fib_entry *fib_entry,
|
|
|
|
enum mlxsw_reg_ralue_op op)
|
|
|
|
{
|
|
|
|
enum mlxsw_reg_ralue_trap_action trap_action;
|
|
|
|
char ralue_pl[MLXSW_REG_RALUE_LEN];
|
|
|
|
|
|
|
|
trap_action = MLXSW_REG_RALUE_TRAP_ACTION_DISCARD_ERROR;
|
|
|
|
mlxsw_sp_fib_entry_ralue_pack(ralue_pl, fib_entry, op);
|
|
|
|
mlxsw_reg_ralue_act_local_pack(ralue_pl, trap_action, 0, 0);
|
|
|
|
return mlxsw_reg_write(mlxsw_sp->core, MLXSW_REG(ralue), ralue_pl);
|
|
|
|
}
|
|
|
|
|
2019-11-08 00:42:15 +08:00
|
|
|
static int
|
|
|
|
mlxsw_sp_fib_entry_op_unreachable(struct mlxsw_sp *mlxsw_sp,
|
|
|
|
struct mlxsw_sp_fib_entry *fib_entry,
|
|
|
|
enum mlxsw_reg_ralue_op op)
|
|
|
|
{
|
|
|
|
enum mlxsw_reg_ralue_trap_action trap_action;
|
|
|
|
char ralue_pl[MLXSW_REG_RALUE_LEN];
|
|
|
|
u16 trap_id;
|
|
|
|
|
|
|
|
trap_action = MLXSW_REG_RALUE_TRAP_ACTION_TRAP;
|
|
|
|
trap_id = MLXSW_TRAP_ID_RTR_INGRESS1;
|
|
|
|
|
|
|
|
mlxsw_sp_fib_entry_ralue_pack(ralue_pl, fib_entry, op);
|
|
|
|
mlxsw_reg_ralue_act_local_pack(ralue_pl, trap_action, trap_id, 0);
|
|
|
|
return mlxsw_reg_write(mlxsw_sp->core, MLXSW_REG(ralue), ralue_pl);
|
|
|
|
}
|
|
|
|
|
2017-09-03 05:49:25 +08:00
|
|
|
static int
|
|
|
|
mlxsw_sp_fib_entry_op_ipip_decap(struct mlxsw_sp *mlxsw_sp,
|
|
|
|
struct mlxsw_sp_fib_entry *fib_entry,
|
|
|
|
enum mlxsw_reg_ralue_op op)
|
|
|
|
{
|
|
|
|
struct mlxsw_sp_ipip_entry *ipip_entry = fib_entry->decap.ipip_entry;
|
|
|
|
const struct mlxsw_sp_ipip_ops *ipip_ops;
|
|
|
|
|
|
|
|
if (WARN_ON(!ipip_entry))
|
|
|
|
return -EINVAL;
|
|
|
|
|
|
|
|
ipip_ops = mlxsw_sp->router->ipip_ops_arr[ipip_entry->ipipt];
|
|
|
|
return ipip_ops->fib_entry_op(mlxsw_sp, ipip_entry, op,
|
|
|
|
fib_entry->decap.tunnel_index);
|
|
|
|
}
|
|
|
|
|
2018-10-17 16:53:07 +08:00
|
|
|
static int mlxsw_sp_fib_entry_op_nve_decap(struct mlxsw_sp *mlxsw_sp,
|
|
|
|
struct mlxsw_sp_fib_entry *fib_entry,
|
|
|
|
enum mlxsw_reg_ralue_op op)
|
|
|
|
{
|
|
|
|
char ralue_pl[MLXSW_REG_RALUE_LEN];
|
|
|
|
|
|
|
|
mlxsw_sp_fib_entry_ralue_pack(ralue_pl, fib_entry, op);
|
|
|
|
mlxsw_reg_ralue_act_ip2me_tun_pack(ralue_pl,
|
|
|
|
fib_entry->decap.tunnel_index);
|
|
|
|
return mlxsw_reg_write(mlxsw_sp->core, MLXSW_REG(ralue), ralue_pl);
|
|
|
|
}
|
|
|
|
|
2017-07-18 16:10:24 +08:00
|
|
|
static int __mlxsw_sp_fib_entry_op(struct mlxsw_sp *mlxsw_sp,
|
|
|
|
struct mlxsw_sp_fib_entry *fib_entry,
|
|
|
|
enum mlxsw_reg_ralue_op op)
|
2016-07-04 14:23:11 +08:00
|
|
|
{
|
|
|
|
switch (fib_entry->type) {
|
|
|
|
case MLXSW_SP_FIB_ENTRY_TYPE_REMOTE:
|
2017-07-18 16:10:24 +08:00
|
|
|
return mlxsw_sp_fib_entry_op_remote(mlxsw_sp, fib_entry, op);
|
2016-07-04 14:23:11 +08:00
|
|
|
case MLXSW_SP_FIB_ENTRY_TYPE_LOCAL:
|
2017-07-18 16:10:24 +08:00
|
|
|
return mlxsw_sp_fib_entry_op_local(mlxsw_sp, fib_entry, op);
|
2016-07-04 14:23:11 +08:00
|
|
|
case MLXSW_SP_FIB_ENTRY_TYPE_TRAP:
|
2017-07-18 16:10:24 +08:00
|
|
|
return mlxsw_sp_fib_entry_op_trap(mlxsw_sp, fib_entry, op);
|
2019-02-07 03:42:01 +08:00
|
|
|
case MLXSW_SP_FIB_ENTRY_TYPE_BLACKHOLE:
|
|
|
|
return mlxsw_sp_fib_entry_op_blackhole(mlxsw_sp, fib_entry, op);
|
2019-11-08 00:42:15 +08:00
|
|
|
case MLXSW_SP_FIB_ENTRY_TYPE_UNREACHABLE:
|
|
|
|
return mlxsw_sp_fib_entry_op_unreachable(mlxsw_sp, fib_entry,
|
|
|
|
op);
|
2017-09-03 05:49:25 +08:00
|
|
|
case MLXSW_SP_FIB_ENTRY_TYPE_IPIP_DECAP:
|
|
|
|
return mlxsw_sp_fib_entry_op_ipip_decap(mlxsw_sp,
|
|
|
|
fib_entry, op);
|
2018-10-17 16:53:07 +08:00
|
|
|
case MLXSW_SP_FIB_ENTRY_TYPE_NVE_DECAP:
|
|
|
|
return mlxsw_sp_fib_entry_op_nve_decap(mlxsw_sp, fib_entry, op);
|
2016-07-04 14:23:11 +08:00
|
|
|
}
|
|
|
|
return -EINVAL;
|
|
|
|
}
|
|
|
|
|
|
|
|
static int mlxsw_sp_fib_entry_op(struct mlxsw_sp *mlxsw_sp,
|
|
|
|
struct mlxsw_sp_fib_entry *fib_entry,
|
|
|
|
enum mlxsw_reg_ralue_op op)
|
|
|
|
{
|
2017-07-18 16:10:24 +08:00
|
|
|
int err = __mlxsw_sp_fib_entry_op(mlxsw_sp, fib_entry, op);
|
2017-02-08 18:16:36 +08:00
|
|
|
|
2020-01-14 19:23:14 +08:00
|
|
|
if (err)
|
|
|
|
return err;
|
|
|
|
|
|
|
|
mlxsw_sp_fib_entry_hw_flags_refresh(mlxsw_sp, fib_entry, op);
|
2017-07-18 16:10:24 +08:00
|
|
|
|
2017-02-08 18:16:36 +08:00
|
|
|
return err;
|
2016-07-04 14:23:11 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
static int mlxsw_sp_fib_entry_update(struct mlxsw_sp *mlxsw_sp,
|
|
|
|
struct mlxsw_sp_fib_entry *fib_entry)
|
|
|
|
{
|
2016-09-01 16:37:41 +08:00
|
|
|
return mlxsw_sp_fib_entry_op(mlxsw_sp, fib_entry,
|
|
|
|
MLXSW_REG_RALUE_OP_WRITE_WRITE);
|
2016-07-04 14:23:11 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
static int mlxsw_sp_fib_entry_del(struct mlxsw_sp *mlxsw_sp,
|
|
|
|
struct mlxsw_sp_fib_entry *fib_entry)
|
|
|
|
{
|
|
|
|
return mlxsw_sp_fib_entry_op(mlxsw_sp, fib_entry,
|
|
|
|
MLXSW_REG_RALUE_OP_WRITE_DELETE);
|
|
|
|
}
|
|
|
|
|
|
|
|
static int
|
2017-02-08 18:16:36 +08:00
|
|
|
mlxsw_sp_fib4_entry_type_set(struct mlxsw_sp *mlxsw_sp,
|
|
|
|
const struct fib_entry_notifier_info *fen_info,
|
|
|
|
struct mlxsw_sp_fib_entry *fib_entry)
|
2016-07-04 14:23:11 +08:00
|
|
|
{
|
2019-06-04 11:19:49 +08:00
|
|
|
struct net_device *dev = fib_info_nh(fen_info->fi, 0)->fib_nh_dev;
|
2017-09-03 05:49:25 +08:00
|
|
|
union mlxsw_sp_l3addr dip = { .addr4 = htonl(fen_info->dst) };
|
2020-02-22 01:54:08 +08:00
|
|
|
struct mlxsw_sp_router *router = mlxsw_sp->router;
|
2018-10-17 16:53:19 +08:00
|
|
|
u32 tb_id = mlxsw_sp_fix_tb_id(fen_info->tb_id);
|
2017-09-03 05:49:25 +08:00
|
|
|
struct mlxsw_sp_ipip_entry *ipip_entry;
|
2016-09-26 18:52:31 +08:00
|
|
|
struct fib_info *fi = fen_info->fi;
|
2016-07-04 14:23:11 +08:00
|
|
|
|
2017-03-10 15:53:38 +08:00
|
|
|
switch (fen_info->type) {
|
|
|
|
case RTN_LOCAL:
|
2017-09-03 05:49:25 +08:00
|
|
|
ipip_entry = mlxsw_sp_ipip_entry_find_by_decap(mlxsw_sp, dev,
|
|
|
|
MLXSW_SP_L3_PROTO_IPV4, dip);
|
2017-11-28 20:17:11 +08:00
|
|
|
if (ipip_entry && ipip_entry->ol_dev->flags & IFF_UP) {
|
2017-09-03 05:49:25 +08:00
|
|
|
fib_entry->type = MLXSW_SP_FIB_ENTRY_TYPE_IPIP_DECAP;
|
|
|
|
return mlxsw_sp_fib_entry_decap_init(mlxsw_sp,
|
|
|
|
fib_entry,
|
|
|
|
ipip_entry);
|
|
|
|
}
|
2020-02-22 01:54:08 +08:00
|
|
|
if (mlxsw_sp_router_nve_is_decap(mlxsw_sp, tb_id,
|
|
|
|
MLXSW_SP_L3_PROTO_IPV4,
|
|
|
|
&dip)) {
|
|
|
|
u32 tunnel_index;
|
2018-10-17 16:53:19 +08:00
|
|
|
|
2020-02-22 01:54:08 +08:00
|
|
|
tunnel_index = router->nve_decap_config.tunnel_index;
|
|
|
|
fib_entry->decap.tunnel_index = tunnel_index;
|
2018-10-17 16:53:19 +08:00
|
|
|
fib_entry->type = MLXSW_SP_FIB_ENTRY_TYPE_NVE_DECAP;
|
|
|
|
return 0;
|
|
|
|
}
|
2017-09-03 05:49:25 +08:00
|
|
|
/* fall through */
|
|
|
|
case RTN_BROADCAST:
|
2016-07-04 14:23:11 +08:00
|
|
|
fib_entry->type = MLXSW_SP_FIB_ENTRY_TYPE_TRAP;
|
|
|
|
return 0;
|
2019-02-07 03:42:01 +08:00
|
|
|
case RTN_BLACKHOLE:
|
|
|
|
fib_entry->type = MLXSW_SP_FIB_ENTRY_TYPE_BLACKHOLE;
|
|
|
|
return 0;
|
2017-03-10 15:53:38 +08:00
|
|
|
case RTN_UNREACHABLE: /* fall through */
|
|
|
|
case RTN_PROHIBIT:
|
|
|
|
/* Packets hitting these routes need to be trapped, but
|
|
|
|
* can do so with a lower priority than packets directed
|
|
|
|
* at the host, so use action type local instead of trap.
|
|
|
|
*/
|
2019-11-08 00:42:15 +08:00
|
|
|
fib_entry->type = MLXSW_SP_FIB_ENTRY_TYPE_UNREACHABLE;
|
2017-03-10 15:53:38 +08:00
|
|
|
return 0;
|
|
|
|
case RTN_UNICAST:
|
2017-09-03 05:49:20 +08:00
|
|
|
if (mlxsw_sp_fi_is_gateway(mlxsw_sp, fi))
|
2017-03-10 15:53:38 +08:00
|
|
|
fib_entry->type = MLXSW_SP_FIB_ENTRY_TYPE_REMOTE;
|
2017-09-03 05:49:20 +08:00
|
|
|
else
|
|
|
|
fib_entry->type = MLXSW_SP_FIB_ENTRY_TYPE_LOCAL;
|
2017-03-10 15:53:38 +08:00
|
|
|
return 0;
|
|
|
|
default:
|
|
|
|
return -EINVAL;
|
|
|
|
}
|
2016-07-05 17:27:50 +08:00
|
|
|
}
|
|
|
|
|
2019-12-27 00:41:15 +08:00
|
|
|
static void
|
|
|
|
mlxsw_sp_fib4_entry_type_unset(struct mlxsw_sp *mlxsw_sp,
|
|
|
|
struct mlxsw_sp_fib_entry *fib_entry)
|
|
|
|
{
|
|
|
|
switch (fib_entry->type) {
|
|
|
|
case MLXSW_SP_FIB_ENTRY_TYPE_IPIP_DECAP:
|
|
|
|
mlxsw_sp_fib_entry_decap_fini(mlxsw_sp, fib_entry);
|
|
|
|
break;
|
|
|
|
default:
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2017-07-18 16:10:26 +08:00
|
|
|
static struct mlxsw_sp_fib4_entry *
|
mlxsw: spectrum_router: Correctly handle identical routes
In the device, routes are indexed in a routing table based on the prefix
and its length. This is in contrast to the kernel's FIB where several
FIB aliases can exist with these parameters being identical. In such
cases, the routes will be sorted by table ID (LOCAL first, then MAIN),
TOS and finally priority (metric).
During lookup, these routes will be evaluated in order. In case the
packet's TOS field is non-zero and a FIB alias with a matching TOS is
found, then it's selected. Otherwise, the lookup defaults to the route
with TOS 0 (if it exists). However, if the requested scope is narrower
than the one found, then the lookup continues.
To best reflect the kernel's datapath we should take the above into
account. Given a prefix and its length, the reflected route will always
be the first one in the FIB alias list. However, if the route has a
non-zero TOS then its action will be converted to trap instead of
forward, since we currently don't support TOS-based routing. If this
turns out to be a real issue, we can add support for that using
policy-based switching.
The route's scope can be effectively ignored as any packet being routed
by the device would've been looked-up using the widest scope (UNIVERSE).
To achieve that we need to do two changes. Firstly, we need to create
another struct (FIB node) that will hold the list of FIB entries sharing
the same prefix and length. This struct will be hashed using these two
parameters.
Secondly, we need to change the route reflection to match the above
logic, so that the first FIB entry in the list will be programmed into
the device while the rest will remain in the driver's cache in case of
subsequent changes.
Signed-off-by: Ido Schimmel <idosch@mellanox.com>
Signed-off-by: Jiri Pirko <jiri@mellanox.com>
Signed-off-by: David S. Miller <davem@davemloft.net>
2017-02-09 17:28:42 +08:00
|
|
|
mlxsw_sp_fib4_entry_create(struct mlxsw_sp *mlxsw_sp,
|
|
|
|
struct mlxsw_sp_fib_node *fib_node,
|
|
|
|
const struct fib_entry_notifier_info *fen_info)
|
2016-07-04 14:23:11 +08:00
|
|
|
{
|
2017-07-18 16:10:26 +08:00
|
|
|
struct mlxsw_sp_fib4_entry *fib4_entry;
|
2016-07-04 14:23:11 +08:00
|
|
|
struct mlxsw_sp_fib_entry *fib_entry;
|
|
|
|
int err;
|
|
|
|
|
2017-07-18 16:10:26 +08:00
|
|
|
fib4_entry = kzalloc(sizeof(*fib4_entry), GFP_KERNEL);
|
|
|
|
if (!fib4_entry)
|
|
|
|
return ERR_PTR(-ENOMEM);
|
|
|
|
fib_entry = &fib4_entry->common;
|
2016-07-04 14:23:11 +08:00
|
|
|
|
2017-02-08 18:16:36 +08:00
|
|
|
err = mlxsw_sp_fib4_entry_type_set(mlxsw_sp, fen_info, fib_entry);
|
2016-07-04 14:23:11 +08:00
|
|
|
if (err)
|
2017-02-08 18:16:36 +08:00
|
|
|
goto err_fib4_entry_type_set;
|
2016-07-04 14:23:11 +08:00
|
|
|
|
2017-07-18 16:10:27 +08:00
|
|
|
err = mlxsw_sp_nexthop4_group_get(mlxsw_sp, fib_entry, fen_info->fi);
|
2017-02-08 18:16:33 +08:00
|
|
|
if (err)
|
2017-07-18 16:10:27 +08:00
|
|
|
goto err_nexthop4_group_get;
|
2017-02-08 18:16:33 +08:00
|
|
|
|
2017-07-18 16:10:26 +08:00
|
|
|
fib4_entry->prio = fen_info->fi->fib_priority;
|
|
|
|
fib4_entry->tb_id = fen_info->tb_id;
|
|
|
|
fib4_entry->type = fen_info->type;
|
|
|
|
fib4_entry->tos = fen_info->tos;
|
mlxsw: spectrum_router: Correctly handle identical routes
In the device, routes are indexed in a routing table based on the prefix
and its length. This is in contrast to the kernel's FIB where several
FIB aliases can exist with these parameters being identical. In such
cases, the routes will be sorted by table ID (LOCAL first, then MAIN),
TOS and finally priority (metric).
During lookup, these routes will be evaluated in order. In case the
packet's TOS field is non-zero and a FIB alias with a matching TOS is
found, then it's selected. Otherwise, the lookup defaults to the route
with TOS 0 (if it exists). However, if the requested scope is narrower
than the one found, then the lookup continues.
To best reflect the kernel's datapath we should take the above into
account. Given a prefix and its length, the reflected route will always
be the first one in the FIB alias list. However, if the route has a
non-zero TOS then its action will be converted to trap instead of
forward, since we currently don't support TOS-based routing. If this
turns out to be a real issue, we can add support for that using
policy-based switching.
The route's scope can be effectively ignored as any packet being routed
by the device would've been looked-up using the widest scope (UNIVERSE).
To achieve that we need to do two changes. Firstly, we need to create
another struct (FIB node) that will hold the list of FIB entries sharing
the same prefix and length. This struct will be hashed using these two
parameters.
Secondly, we need to change the route reflection to match the above
logic, so that the first FIB entry in the list will be programmed into
the device while the rest will remain in the driver's cache in case of
subsequent changes.
Signed-off-by: Ido Schimmel <idosch@mellanox.com>
Signed-off-by: Jiri Pirko <jiri@mellanox.com>
Signed-off-by: David S. Miller <davem@davemloft.net>
2017-02-09 17:28:42 +08:00
|
|
|
|
|
|
|
fib_entry->fib_node = fib_node;
|
|
|
|
|
2017-07-18 16:10:26 +08:00
|
|
|
return fib4_entry;
|
2016-09-01 16:37:40 +08:00
|
|
|
|
2017-07-18 16:10:27 +08:00
|
|
|
err_nexthop4_group_get:
|
2019-12-27 00:41:15 +08:00
|
|
|
mlxsw_sp_fib4_entry_type_unset(mlxsw_sp, fib_entry);
|
2017-02-08 18:16:36 +08:00
|
|
|
err_fib4_entry_type_set:
|
2017-07-18 16:10:26 +08:00
|
|
|
kfree(fib4_entry);
|
2016-09-01 16:37:40 +08:00
|
|
|
return ERR_PTR(err);
|
|
|
|
}
|
|
|
|
|
mlxsw: spectrum_router: Correctly handle identical routes
In the device, routes are indexed in a routing table based on the prefix
and its length. This is in contrast to the kernel's FIB where several
FIB aliases can exist with these parameters being identical. In such
cases, the routes will be sorted by table ID (LOCAL first, then MAIN),
TOS and finally priority (metric).
During lookup, these routes will be evaluated in order. In case the
packet's TOS field is non-zero and a FIB alias with a matching TOS is
found, then it's selected. Otherwise, the lookup defaults to the route
with TOS 0 (if it exists). However, if the requested scope is narrower
than the one found, then the lookup continues.
To best reflect the kernel's datapath we should take the above into
account. Given a prefix and its length, the reflected route will always
be the first one in the FIB alias list. However, if the route has a
non-zero TOS then its action will be converted to trap instead of
forward, since we currently don't support TOS-based routing. If this
turns out to be a real issue, we can add support for that using
policy-based switching.
The route's scope can be effectively ignored as any packet being routed
by the device would've been looked-up using the widest scope (UNIVERSE).
To achieve that we need to do two changes. Firstly, we need to create
another struct (FIB node) that will hold the list of FIB entries sharing
the same prefix and length. This struct will be hashed using these two
parameters.
Secondly, we need to change the route reflection to match the above
logic, so that the first FIB entry in the list will be programmed into
the device while the rest will remain in the driver's cache in case of
subsequent changes.
Signed-off-by: Ido Schimmel <idosch@mellanox.com>
Signed-off-by: Jiri Pirko <jiri@mellanox.com>
Signed-off-by: David S. Miller <davem@davemloft.net>
2017-02-09 17:28:42 +08:00
|
|
|
static void mlxsw_sp_fib4_entry_destroy(struct mlxsw_sp *mlxsw_sp,
|
2017-07-18 16:10:26 +08:00
|
|
|
struct mlxsw_sp_fib4_entry *fib4_entry)
|
mlxsw: spectrum_router: Correctly handle identical routes
In the device, routes are indexed in a routing table based on the prefix
and its length. This is in contrast to the kernel's FIB where several
FIB aliases can exist with these parameters being identical. In such
cases, the routes will be sorted by table ID (LOCAL first, then MAIN),
TOS and finally priority (metric).
During lookup, these routes will be evaluated in order. In case the
packet's TOS field is non-zero and a FIB alias with a matching TOS is
found, then it's selected. Otherwise, the lookup defaults to the route
with TOS 0 (if it exists). However, if the requested scope is narrower
than the one found, then the lookup continues.
To best reflect the kernel's datapath we should take the above into
account. Given a prefix and its length, the reflected route will always
be the first one in the FIB alias list. However, if the route has a
non-zero TOS then its action will be converted to trap instead of
forward, since we currently don't support TOS-based routing. If this
turns out to be a real issue, we can add support for that using
policy-based switching.
The route's scope can be effectively ignored as any packet being routed
by the device would've been looked-up using the widest scope (UNIVERSE).
To achieve that we need to do two changes. Firstly, we need to create
another struct (FIB node) that will hold the list of FIB entries sharing
the same prefix and length. This struct will be hashed using these two
parameters.
Secondly, we need to change the route reflection to match the above
logic, so that the first FIB entry in the list will be programmed into
the device while the rest will remain in the driver's cache in case of
subsequent changes.
Signed-off-by: Ido Schimmel <idosch@mellanox.com>
Signed-off-by: Jiri Pirko <jiri@mellanox.com>
Signed-off-by: David S. Miller <davem@davemloft.net>
2017-02-09 17:28:42 +08:00
|
|
|
{
|
2017-07-18 16:10:27 +08:00
|
|
|
mlxsw_sp_nexthop4_group_put(mlxsw_sp, &fib4_entry->common);
|
2019-12-27 00:41:15 +08:00
|
|
|
mlxsw_sp_fib4_entry_type_unset(mlxsw_sp, &fib4_entry->common);
|
2017-07-18 16:10:26 +08:00
|
|
|
kfree(fib4_entry);
|
mlxsw: spectrum_router: Correctly handle identical routes
In the device, routes are indexed in a routing table based on the prefix
and its length. This is in contrast to the kernel's FIB where several
FIB aliases can exist with these parameters being identical. In such
cases, the routes will be sorted by table ID (LOCAL first, then MAIN),
TOS and finally priority (metric).
During lookup, these routes will be evaluated in order. In case the
packet's TOS field is non-zero and a FIB alias with a matching TOS is
found, then it's selected. Otherwise, the lookup defaults to the route
with TOS 0 (if it exists). However, if the requested scope is narrower
than the one found, then the lookup continues.
To best reflect the kernel's datapath we should take the above into
account. Given a prefix and its length, the reflected route will always
be the first one in the FIB alias list. However, if the route has a
non-zero TOS then its action will be converted to trap instead of
forward, since we currently don't support TOS-based routing. If this
turns out to be a real issue, we can add support for that using
policy-based switching.
The route's scope can be effectively ignored as any packet being routed
by the device would've been looked-up using the widest scope (UNIVERSE).
To achieve that we need to do two changes. Firstly, we need to create
another struct (FIB node) that will hold the list of FIB entries sharing
the same prefix and length. This struct will be hashed using these two
parameters.
Secondly, we need to change the route reflection to match the above
logic, so that the first FIB entry in the list will be programmed into
the device while the rest will remain in the driver's cache in case of
subsequent changes.
Signed-off-by: Ido Schimmel <idosch@mellanox.com>
Signed-off-by: Jiri Pirko <jiri@mellanox.com>
Signed-off-by: David S. Miller <davem@davemloft.net>
2017-02-09 17:28:42 +08:00
|
|
|
}
|
|
|
|
|
2017-07-18 16:10:26 +08:00
|
|
|
static struct mlxsw_sp_fib4_entry *
|
mlxsw: spectrum_router: Correctly handle identical routes
In the device, routes are indexed in a routing table based on the prefix
and its length. This is in contrast to the kernel's FIB where several
FIB aliases can exist with these parameters being identical. In such
cases, the routes will be sorted by table ID (LOCAL first, then MAIN),
TOS and finally priority (metric).
During lookup, these routes will be evaluated in order. In case the
packet's TOS field is non-zero and a FIB alias with a matching TOS is
found, then it's selected. Otherwise, the lookup defaults to the route
with TOS 0 (if it exists). However, if the requested scope is narrower
than the one found, then the lookup continues.
To best reflect the kernel's datapath we should take the above into
account. Given a prefix and its length, the reflected route will always
be the first one in the FIB alias list. However, if the route has a
non-zero TOS then its action will be converted to trap instead of
forward, since we currently don't support TOS-based routing. If this
turns out to be a real issue, we can add support for that using
policy-based switching.
The route's scope can be effectively ignored as any packet being routed
by the device would've been looked-up using the widest scope (UNIVERSE).
To achieve that we need to do two changes. Firstly, we need to create
another struct (FIB node) that will hold the list of FIB entries sharing
the same prefix and length. This struct will be hashed using these two
parameters.
Secondly, we need to change the route reflection to match the above
logic, so that the first FIB entry in the list will be programmed into
the device while the rest will remain in the driver's cache in case of
subsequent changes.
Signed-off-by: Ido Schimmel <idosch@mellanox.com>
Signed-off-by: Jiri Pirko <jiri@mellanox.com>
Signed-off-by: David S. Miller <davem@davemloft.net>
2017-02-09 17:28:42 +08:00
|
|
|
mlxsw_sp_fib4_entry_lookup(struct mlxsw_sp *mlxsw_sp,
|
|
|
|
const struct fib_entry_notifier_info *fen_info)
|
2016-09-01 16:37:40 +08:00
|
|
|
{
|
2017-07-18 16:10:26 +08:00
|
|
|
struct mlxsw_sp_fib4_entry *fib4_entry;
|
mlxsw: spectrum_router: Correctly handle identical routes
In the device, routes are indexed in a routing table based on the prefix
and its length. This is in contrast to the kernel's FIB where several
FIB aliases can exist with these parameters being identical. In such
cases, the routes will be sorted by table ID (LOCAL first, then MAIN),
TOS and finally priority (metric).
During lookup, these routes will be evaluated in order. In case the
packet's TOS field is non-zero and a FIB alias with a matching TOS is
found, then it's selected. Otherwise, the lookup defaults to the route
with TOS 0 (if it exists). However, if the requested scope is narrower
than the one found, then the lookup continues.
To best reflect the kernel's datapath we should take the above into
account. Given a prefix and its length, the reflected route will always
be the first one in the FIB alias list. However, if the route has a
non-zero TOS then its action will be converted to trap instead of
forward, since we currently don't support TOS-based routing. If this
turns out to be a real issue, we can add support for that using
policy-based switching.
The route's scope can be effectively ignored as any packet being routed
by the device would've been looked-up using the widest scope (UNIVERSE).
To achieve that we need to do two changes. Firstly, we need to create
another struct (FIB node) that will hold the list of FIB entries sharing
the same prefix and length. This struct will be hashed using these two
parameters.
Secondly, we need to change the route reflection to match the above
logic, so that the first FIB entry in the list will be programmed into
the device while the rest will remain in the driver's cache in case of
subsequent changes.
Signed-off-by: Ido Schimmel <idosch@mellanox.com>
Signed-off-by: Jiri Pirko <jiri@mellanox.com>
Signed-off-by: David S. Miller <davem@davemloft.net>
2017-02-09 17:28:42 +08:00
|
|
|
struct mlxsw_sp_fib_node *fib_node;
|
2017-07-18 16:10:20 +08:00
|
|
|
struct mlxsw_sp_fib *fib;
|
|
|
|
struct mlxsw_sp_vr *vr;
|
|
|
|
|
|
|
|
vr = mlxsw_sp_vr_find(mlxsw_sp, fen_info->tb_id);
|
|
|
|
if (!vr)
|
|
|
|
return NULL;
|
|
|
|
fib = mlxsw_sp_vr_fib(vr, MLXSW_SP_L3_PROTO_IPV4);
|
2016-09-01 16:37:40 +08:00
|
|
|
|
2017-07-18 16:10:20 +08:00
|
|
|
fib_node = mlxsw_sp_fib_node_lookup(fib, &fen_info->dst,
|
|
|
|
sizeof(fen_info->dst),
|
|
|
|
fen_info->dst_len);
|
|
|
|
if (!fib_node)
|
mlxsw: spectrum_router: Correctly handle identical routes
In the device, routes are indexed in a routing table based on the prefix
and its length. This is in contrast to the kernel's FIB where several
FIB aliases can exist with these parameters being identical. In such
cases, the routes will be sorted by table ID (LOCAL first, then MAIN),
TOS and finally priority (metric).
During lookup, these routes will be evaluated in order. In case the
packet's TOS field is non-zero and a FIB alias with a matching TOS is
found, then it's selected. Otherwise, the lookup defaults to the route
with TOS 0 (if it exists). However, if the requested scope is narrower
than the one found, then the lookup continues.
To best reflect the kernel's datapath we should take the above into
account. Given a prefix and its length, the reflected route will always
be the first one in the FIB alias list. However, if the route has a
non-zero TOS then its action will be converted to trap instead of
forward, since we currently don't support TOS-based routing. If this
turns out to be a real issue, we can add support for that using
policy-based switching.
The route's scope can be effectively ignored as any packet being routed
by the device would've been looked-up using the widest scope (UNIVERSE).
To achieve that we need to do two changes. Firstly, we need to create
another struct (FIB node) that will hold the list of FIB entries sharing
the same prefix and length. This struct will be hashed using these two
parameters.
Secondly, we need to change the route reflection to match the above
logic, so that the first FIB entry in the list will be programmed into
the device while the rest will remain in the driver's cache in case of
subsequent changes.
Signed-off-by: Ido Schimmel <idosch@mellanox.com>
Signed-off-by: Jiri Pirko <jiri@mellanox.com>
Signed-off-by: David S. Miller <davem@davemloft.net>
2017-02-09 17:28:42 +08:00
|
|
|
return NULL;
|
|
|
|
|
2019-12-27 00:41:17 +08:00
|
|
|
fib4_entry = container_of(fib_node->fib_entry,
|
|
|
|
struct mlxsw_sp_fib4_entry, common);
|
|
|
|
if (fib4_entry->tb_id == fen_info->tb_id &&
|
|
|
|
fib4_entry->tos == fen_info->tos &&
|
|
|
|
fib4_entry->type == fen_info->type &&
|
|
|
|
mlxsw_sp_nexthop4_group_fi(fib4_entry->common.nh_group) ==
|
|
|
|
fen_info->fi)
|
|
|
|
return fib4_entry;
|
mlxsw: spectrum_router: Correctly handle identical routes
In the device, routes are indexed in a routing table based on the prefix
and its length. This is in contrast to the kernel's FIB where several
FIB aliases can exist with these parameters being identical. In such
cases, the routes will be sorted by table ID (LOCAL first, then MAIN),
TOS and finally priority (metric).
During lookup, these routes will be evaluated in order. In case the
packet's TOS field is non-zero and a FIB alias with a matching TOS is
found, then it's selected. Otherwise, the lookup defaults to the route
with TOS 0 (if it exists). However, if the requested scope is narrower
than the one found, then the lookup continues.
To best reflect the kernel's datapath we should take the above into
account. Given a prefix and its length, the reflected route will always
be the first one in the FIB alias list. However, if the route has a
non-zero TOS then its action will be converted to trap instead of
forward, since we currently don't support TOS-based routing. If this
turns out to be a real issue, we can add support for that using
policy-based switching.
The route's scope can be effectively ignored as any packet being routed
by the device would've been looked-up using the widest scope (UNIVERSE).
To achieve that we need to do two changes. Firstly, we need to create
another struct (FIB node) that will hold the list of FIB entries sharing
the same prefix and length. This struct will be hashed using these two
parameters.
Secondly, we need to change the route reflection to match the above
logic, so that the first FIB entry in the list will be programmed into
the device while the rest will remain in the driver's cache in case of
subsequent changes.
Signed-off-by: Ido Schimmel <idosch@mellanox.com>
Signed-off-by: Jiri Pirko <jiri@mellanox.com>
Signed-off-by: David S. Miller <davem@davemloft.net>
2017-02-09 17:28:42 +08:00
|
|
|
|
|
|
|
return NULL;
|
|
|
|
}
|
|
|
|
|
|
|
|
static const struct rhashtable_params mlxsw_sp_fib_ht_params = {
|
|
|
|
.key_offset = offsetof(struct mlxsw_sp_fib_node, key),
|
|
|
|
.head_offset = offsetof(struct mlxsw_sp_fib_node, ht_node),
|
|
|
|
.key_len = sizeof(struct mlxsw_sp_fib_key),
|
|
|
|
.automatic_shrinking = true,
|
|
|
|
};
|
|
|
|
|
|
|
|
static int mlxsw_sp_fib_node_insert(struct mlxsw_sp_fib *fib,
|
|
|
|
struct mlxsw_sp_fib_node *fib_node)
|
|
|
|
{
|
|
|
|
return rhashtable_insert_fast(&fib->ht, &fib_node->ht_node,
|
|
|
|
mlxsw_sp_fib_ht_params);
|
|
|
|
}
|
|
|
|
|
|
|
|
static void mlxsw_sp_fib_node_remove(struct mlxsw_sp_fib *fib,
|
|
|
|
struct mlxsw_sp_fib_node *fib_node)
|
|
|
|
{
|
|
|
|
rhashtable_remove_fast(&fib->ht, &fib_node->ht_node,
|
|
|
|
mlxsw_sp_fib_ht_params);
|
|
|
|
}
|
|
|
|
|
|
|
|
static struct mlxsw_sp_fib_node *
|
|
|
|
mlxsw_sp_fib_node_lookup(struct mlxsw_sp_fib *fib, const void *addr,
|
|
|
|
size_t addr_len, unsigned char prefix_len)
|
|
|
|
{
|
|
|
|
struct mlxsw_sp_fib_key key;
|
|
|
|
|
|
|
|
memset(&key, 0, sizeof(key));
|
|
|
|
memcpy(key.addr, addr, addr_len);
|
|
|
|
key.prefix_len = prefix_len;
|
|
|
|
return rhashtable_lookup_fast(&fib->ht, &key, mlxsw_sp_fib_ht_params);
|
|
|
|
}
|
|
|
|
|
|
|
|
static struct mlxsw_sp_fib_node *
|
2017-03-10 15:53:41 +08:00
|
|
|
mlxsw_sp_fib_node_create(struct mlxsw_sp_fib *fib, const void *addr,
|
mlxsw: spectrum_router: Correctly handle identical routes
In the device, routes are indexed in a routing table based on the prefix
and its length. This is in contrast to the kernel's FIB where several
FIB aliases can exist with these parameters being identical. In such
cases, the routes will be sorted by table ID (LOCAL first, then MAIN),
TOS and finally priority (metric).
During lookup, these routes will be evaluated in order. In case the
packet's TOS field is non-zero and a FIB alias with a matching TOS is
found, then it's selected. Otherwise, the lookup defaults to the route
with TOS 0 (if it exists). However, if the requested scope is narrower
than the one found, then the lookup continues.
To best reflect the kernel's datapath we should take the above into
account. Given a prefix and its length, the reflected route will always
be the first one in the FIB alias list. However, if the route has a
non-zero TOS then its action will be converted to trap instead of
forward, since we currently don't support TOS-based routing. If this
turns out to be a real issue, we can add support for that using
policy-based switching.
The route's scope can be effectively ignored as any packet being routed
by the device would've been looked-up using the widest scope (UNIVERSE).
To achieve that we need to do two changes. Firstly, we need to create
another struct (FIB node) that will hold the list of FIB entries sharing
the same prefix and length. This struct will be hashed using these two
parameters.
Secondly, we need to change the route reflection to match the above
logic, so that the first FIB entry in the list will be programmed into
the device while the rest will remain in the driver's cache in case of
subsequent changes.
Signed-off-by: Ido Schimmel <idosch@mellanox.com>
Signed-off-by: Jiri Pirko <jiri@mellanox.com>
Signed-off-by: David S. Miller <davem@davemloft.net>
2017-02-09 17:28:42 +08:00
|
|
|
size_t addr_len, unsigned char prefix_len)
|
|
|
|
{
|
|
|
|
struct mlxsw_sp_fib_node *fib_node;
|
|
|
|
|
|
|
|
fib_node = kzalloc(sizeof(*fib_node), GFP_KERNEL);
|
|
|
|
if (!fib_node)
|
2016-09-01 16:37:40 +08:00
|
|
|
return NULL;
|
|
|
|
|
2017-03-10 15:53:41 +08:00
|
|
|
list_add(&fib_node->list, &fib->node_list);
|
mlxsw: spectrum_router: Correctly handle identical routes
In the device, routes are indexed in a routing table based on the prefix
and its length. This is in contrast to the kernel's FIB where several
FIB aliases can exist with these parameters being identical. In such
cases, the routes will be sorted by table ID (LOCAL first, then MAIN),
TOS and finally priority (metric).
During lookup, these routes will be evaluated in order. In case the
packet's TOS field is non-zero and a FIB alias with a matching TOS is
found, then it's selected. Otherwise, the lookup defaults to the route
with TOS 0 (if it exists). However, if the requested scope is narrower
than the one found, then the lookup continues.
To best reflect the kernel's datapath we should take the above into
account. Given a prefix and its length, the reflected route will always
be the first one in the FIB alias list. However, if the route has a
non-zero TOS then its action will be converted to trap instead of
forward, since we currently don't support TOS-based routing. If this
turns out to be a real issue, we can add support for that using
policy-based switching.
The route's scope can be effectively ignored as any packet being routed
by the device would've been looked-up using the widest scope (UNIVERSE).
To achieve that we need to do two changes. Firstly, we need to create
another struct (FIB node) that will hold the list of FIB entries sharing
the same prefix and length. This struct will be hashed using these two
parameters.
Secondly, we need to change the route reflection to match the above
logic, so that the first FIB entry in the list will be programmed into
the device while the rest will remain in the driver's cache in case of
subsequent changes.
Signed-off-by: Ido Schimmel <idosch@mellanox.com>
Signed-off-by: Jiri Pirko <jiri@mellanox.com>
Signed-off-by: David S. Miller <davem@davemloft.net>
2017-02-09 17:28:42 +08:00
|
|
|
memcpy(fib_node->key.addr, addr, addr_len);
|
|
|
|
fib_node->key.prefix_len = prefix_len;
|
|
|
|
|
|
|
|
return fib_node;
|
|
|
|
}
|
|
|
|
|
|
|
|
static void mlxsw_sp_fib_node_destroy(struct mlxsw_sp_fib_node *fib_node)
|
|
|
|
{
|
|
|
|
list_del(&fib_node->list);
|
|
|
|
kfree(fib_node);
|
|
|
|
}
|
|
|
|
|
2017-08-14 16:54:05 +08:00
|
|
|
static int mlxsw_sp_fib_lpm_tree_link(struct mlxsw_sp *mlxsw_sp,
|
|
|
|
struct mlxsw_sp_fib_node *fib_node)
|
|
|
|
{
|
2018-01-22 16:17:42 +08:00
|
|
|
struct mlxsw_sp_prefix_usage req_prefix_usage;
|
2018-01-22 16:17:41 +08:00
|
|
|
struct mlxsw_sp_fib *fib = fib_node->fib;
|
2017-08-14 16:54:05 +08:00
|
|
|
struct mlxsw_sp_lpm_tree *lpm_tree;
|
|
|
|
int err;
|
|
|
|
|
2018-01-22 16:17:42 +08:00
|
|
|
lpm_tree = mlxsw_sp->router->lpm.proto_trees[fib->proto];
|
|
|
|
if (lpm_tree->prefix_ref_count[fib_node->key.prefix_len] != 0)
|
|
|
|
goto out;
|
2017-08-14 16:54:05 +08:00
|
|
|
|
2018-01-22 16:17:42 +08:00
|
|
|
mlxsw_sp_prefix_usage_cpy(&req_prefix_usage, &lpm_tree->prefix_usage);
|
|
|
|
mlxsw_sp_prefix_usage_set(&req_prefix_usage, fib_node->key.prefix_len);
|
2017-08-14 16:54:05 +08:00
|
|
|
lpm_tree = mlxsw_sp_lpm_tree_get(mlxsw_sp, &req_prefix_usage,
|
|
|
|
fib->proto);
|
|
|
|
if (IS_ERR(lpm_tree))
|
|
|
|
return PTR_ERR(lpm_tree);
|
|
|
|
|
|
|
|
err = mlxsw_sp_vrs_lpm_tree_replace(mlxsw_sp, fib, lpm_tree);
|
|
|
|
if (err)
|
2018-01-22 16:17:42 +08:00
|
|
|
goto err_lpm_tree_replace;
|
2017-08-14 16:54:05 +08:00
|
|
|
|
2018-01-22 16:17:42 +08:00
|
|
|
out:
|
|
|
|
lpm_tree->prefix_ref_count[fib_node->key.prefix_len]++;
|
2017-08-14 16:54:05 +08:00
|
|
|
return 0;
|
2018-01-22 16:17:42 +08:00
|
|
|
|
|
|
|
err_lpm_tree_replace:
|
|
|
|
mlxsw_sp_lpm_tree_put(mlxsw_sp, lpm_tree);
|
|
|
|
return err;
|
2017-08-14 16:54:05 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
static void mlxsw_sp_fib_lpm_tree_unlink(struct mlxsw_sp *mlxsw_sp,
|
2018-01-22 16:17:41 +08:00
|
|
|
struct mlxsw_sp_fib_node *fib_node)
|
2017-08-14 16:54:05 +08:00
|
|
|
{
|
2018-01-22 16:17:42 +08:00
|
|
|
struct mlxsw_sp_lpm_tree *lpm_tree = fib_node->fib->lpm_tree;
|
|
|
|
struct mlxsw_sp_prefix_usage req_prefix_usage;
|
2018-01-22 16:17:41 +08:00
|
|
|
struct mlxsw_sp_fib *fib = fib_node->fib;
|
2018-01-22 16:17:42 +08:00
|
|
|
int err;
|
2018-01-22 16:17:41 +08:00
|
|
|
|
2018-01-22 16:17:42 +08:00
|
|
|
if (--lpm_tree->prefix_ref_count[fib_node->key.prefix_len] != 0)
|
2017-08-14 16:54:05 +08:00
|
|
|
return;
|
2018-01-22 16:17:42 +08:00
|
|
|
/* Try to construct a new LPM tree from the current prefix usage
|
|
|
|
* minus the unused one. If we fail, continue using the old one.
|
2018-01-22 16:17:40 +08:00
|
|
|
*/
|
2018-01-22 16:17:42 +08:00
|
|
|
mlxsw_sp_prefix_usage_cpy(&req_prefix_usage, &lpm_tree->prefix_usage);
|
|
|
|
mlxsw_sp_prefix_usage_clear(&req_prefix_usage,
|
|
|
|
fib_node->key.prefix_len);
|
|
|
|
lpm_tree = mlxsw_sp_lpm_tree_get(mlxsw_sp, &req_prefix_usage,
|
|
|
|
fib->proto);
|
|
|
|
if (IS_ERR(lpm_tree))
|
|
|
|
return;
|
mlxsw: spectrum_router: Correctly handle identical routes
In the device, routes are indexed in a routing table based on the prefix
and its length. This is in contrast to the kernel's FIB where several
FIB aliases can exist with these parameters being identical. In such
cases, the routes will be sorted by table ID (LOCAL first, then MAIN),
TOS and finally priority (metric).
During lookup, these routes will be evaluated in order. In case the
packet's TOS field is non-zero and a FIB alias with a matching TOS is
found, then it's selected. Otherwise, the lookup defaults to the route
with TOS 0 (if it exists). However, if the requested scope is narrower
than the one found, then the lookup continues.
To best reflect the kernel's datapath we should take the above into
account. Given a prefix and its length, the reflected route will always
be the first one in the FIB alias list. However, if the route has a
non-zero TOS then its action will be converted to trap instead of
forward, since we currently don't support TOS-based routing. If this
turns out to be a real issue, we can add support for that using
policy-based switching.
The route's scope can be effectively ignored as any packet being routed
by the device would've been looked-up using the widest scope (UNIVERSE).
To achieve that we need to do two changes. Firstly, we need to create
another struct (FIB node) that will hold the list of FIB entries sharing
the same prefix and length. This struct will be hashed using these two
parameters.
Secondly, we need to change the route reflection to match the above
logic, so that the first FIB entry in the list will be programmed into
the device while the rest will remain in the driver's cache in case of
subsequent changes.
Signed-off-by: Ido Schimmel <idosch@mellanox.com>
Signed-off-by: Jiri Pirko <jiri@mellanox.com>
Signed-off-by: David S. Miller <davem@davemloft.net>
2017-02-09 17:28:42 +08:00
|
|
|
|
2018-01-22 16:17:42 +08:00
|
|
|
err = mlxsw_sp_vrs_lpm_tree_replace(mlxsw_sp, fib, lpm_tree);
|
|
|
|
if (err)
|
|
|
|
goto err_lpm_tree_replace;
|
mlxsw: spectrum_router: Correctly handle identical routes
In the device, routes are indexed in a routing table based on the prefix
and its length. This is in contrast to the kernel's FIB where several
FIB aliases can exist with these parameters being identical. In such
cases, the routes will be sorted by table ID (LOCAL first, then MAIN),
TOS and finally priority (metric).
During lookup, these routes will be evaluated in order. In case the
packet's TOS field is non-zero and a FIB alias with a matching TOS is
found, then it's selected. Otherwise, the lookup defaults to the route
with TOS 0 (if it exists). However, if the requested scope is narrower
than the one found, then the lookup continues.
To best reflect the kernel's datapath we should take the above into
account. Given a prefix and its length, the reflected route will always
be the first one in the FIB alias list. However, if the route has a
non-zero TOS then its action will be converted to trap instead of
forward, since we currently don't support TOS-based routing. If this
turns out to be a real issue, we can add support for that using
policy-based switching.
The route's scope can be effectively ignored as any packet being routed
by the device would've been looked-up using the widest scope (UNIVERSE).
To achieve that we need to do two changes. Firstly, we need to create
another struct (FIB node) that will hold the list of FIB entries sharing
the same prefix and length. This struct will be hashed using these two
parameters.
Secondly, we need to change the route reflection to match the above
logic, so that the first FIB entry in the list will be programmed into
the device while the rest will remain in the driver's cache in case of
subsequent changes.
Signed-off-by: Ido Schimmel <idosch@mellanox.com>
Signed-off-by: Jiri Pirko <jiri@mellanox.com>
Signed-off-by: David S. Miller <davem@davemloft.net>
2017-02-09 17:28:42 +08:00
|
|
|
|
2018-01-22 16:17:42 +08:00
|
|
|
return;
|
mlxsw: spectrum_router: Correctly handle identical routes
In the device, routes are indexed in a routing table based on the prefix
and its length. This is in contrast to the kernel's FIB where several
FIB aliases can exist with these parameters being identical. In such
cases, the routes will be sorted by table ID (LOCAL first, then MAIN),
TOS and finally priority (metric).
During lookup, these routes will be evaluated in order. In case the
packet's TOS field is non-zero and a FIB alias with a matching TOS is
found, then it's selected. Otherwise, the lookup defaults to the route
with TOS 0 (if it exists). However, if the requested scope is narrower
than the one found, then the lookup continues.
To best reflect the kernel's datapath we should take the above into
account. Given a prefix and its length, the reflected route will always
be the first one in the FIB alias list. However, if the route has a
non-zero TOS then its action will be converted to trap instead of
forward, since we currently don't support TOS-based routing. If this
turns out to be a real issue, we can add support for that using
policy-based switching.
The route's scope can be effectively ignored as any packet being routed
by the device would've been looked-up using the widest scope (UNIVERSE).
To achieve that we need to do two changes. Firstly, we need to create
another struct (FIB node) that will hold the list of FIB entries sharing
the same prefix and length. This struct will be hashed using these two
parameters.
Secondly, we need to change the route reflection to match the above
logic, so that the first FIB entry in the list will be programmed into
the device while the rest will remain in the driver's cache in case of
subsequent changes.
Signed-off-by: Ido Schimmel <idosch@mellanox.com>
Signed-off-by: Jiri Pirko <jiri@mellanox.com>
Signed-off-by: David S. Miller <davem@davemloft.net>
2017-02-09 17:28:42 +08:00
|
|
|
|
2018-01-22 16:17:42 +08:00
|
|
|
err_lpm_tree_replace:
|
|
|
|
mlxsw_sp_lpm_tree_put(mlxsw_sp, lpm_tree);
|
2016-09-01 16:37:40 +08:00
|
|
|
}
|
|
|
|
|
2017-03-10 15:53:41 +08:00
|
|
|
static int mlxsw_sp_fib_node_init(struct mlxsw_sp *mlxsw_sp,
|
|
|
|
struct mlxsw_sp_fib_node *fib_node,
|
|
|
|
struct mlxsw_sp_fib *fib)
|
|
|
|
{
|
|
|
|
int err;
|
|
|
|
|
|
|
|
err = mlxsw_sp_fib_node_insert(fib, fib_node);
|
|
|
|
if (err)
|
|
|
|
return err;
|
|
|
|
fib_node->fib = fib;
|
|
|
|
|
2018-01-22 16:17:41 +08:00
|
|
|
err = mlxsw_sp_fib_lpm_tree_link(mlxsw_sp, fib_node);
|
2017-08-14 16:54:05 +08:00
|
|
|
if (err)
|
|
|
|
goto err_fib_lpm_tree_link;
|
2017-03-10 15:53:41 +08:00
|
|
|
|
|
|
|
return 0;
|
|
|
|
|
2017-08-14 16:54:05 +08:00
|
|
|
err_fib_lpm_tree_link:
|
2017-03-10 15:53:41 +08:00
|
|
|
fib_node->fib = NULL;
|
|
|
|
mlxsw_sp_fib_node_remove(fib, fib_node);
|
|
|
|
return err;
|
|
|
|
}
|
|
|
|
|
|
|
|
static void mlxsw_sp_fib_node_fini(struct mlxsw_sp *mlxsw_sp,
|
|
|
|
struct mlxsw_sp_fib_node *fib_node)
|
|
|
|
{
|
|
|
|
struct mlxsw_sp_fib *fib = fib_node->fib;
|
|
|
|
|
2018-01-22 16:17:41 +08:00
|
|
|
mlxsw_sp_fib_lpm_tree_unlink(mlxsw_sp, fib_node);
|
2017-03-10 15:53:41 +08:00
|
|
|
fib_node->fib = NULL;
|
|
|
|
mlxsw_sp_fib_node_remove(fib, fib_node);
|
|
|
|
}
|
|
|
|
|
mlxsw: spectrum_router: Correctly handle identical routes
In the device, routes are indexed in a routing table based on the prefix
and its length. This is in contrast to the kernel's FIB where several
FIB aliases can exist with these parameters being identical. In such
cases, the routes will be sorted by table ID (LOCAL first, then MAIN),
TOS and finally priority (metric).
During lookup, these routes will be evaluated in order. In case the
packet's TOS field is non-zero and a FIB alias with a matching TOS is
found, then it's selected. Otherwise, the lookup defaults to the route
with TOS 0 (if it exists). However, if the requested scope is narrower
than the one found, then the lookup continues.
To best reflect the kernel's datapath we should take the above into
account. Given a prefix and its length, the reflected route will always
be the first one in the FIB alias list. However, if the route has a
non-zero TOS then its action will be converted to trap instead of
forward, since we currently don't support TOS-based routing. If this
turns out to be a real issue, we can add support for that using
policy-based switching.
The route's scope can be effectively ignored as any packet being routed
by the device would've been looked-up using the widest scope (UNIVERSE).
To achieve that we need to do two changes. Firstly, we need to create
another struct (FIB node) that will hold the list of FIB entries sharing
the same prefix and length. This struct will be hashed using these two
parameters.
Secondly, we need to change the route reflection to match the above
logic, so that the first FIB entry in the list will be programmed into
the device while the rest will remain in the driver's cache in case of
subsequent changes.
Signed-off-by: Ido Schimmel <idosch@mellanox.com>
Signed-off-by: Jiri Pirko <jiri@mellanox.com>
Signed-off-by: David S. Miller <davem@davemloft.net>
2017-02-09 17:28:42 +08:00
|
|
|
static struct mlxsw_sp_fib_node *
|
2017-07-18 16:10:21 +08:00
|
|
|
mlxsw_sp_fib_node_get(struct mlxsw_sp *mlxsw_sp, u32 tb_id, const void *addr,
|
|
|
|
size_t addr_len, unsigned char prefix_len,
|
|
|
|
enum mlxsw_sp_l3proto proto)
|
2016-09-01 16:37:40 +08:00
|
|
|
{
|
mlxsw: spectrum_router: Correctly handle identical routes
In the device, routes are indexed in a routing table based on the prefix
and its length. This is in contrast to the kernel's FIB where several
FIB aliases can exist with these parameters being identical. In such
cases, the routes will be sorted by table ID (LOCAL first, then MAIN),
TOS and finally priority (metric).
During lookup, these routes will be evaluated in order. In case the
packet's TOS field is non-zero and a FIB alias with a matching TOS is
found, then it's selected. Otherwise, the lookup defaults to the route
with TOS 0 (if it exists). However, if the requested scope is narrower
than the one found, then the lookup continues.
To best reflect the kernel's datapath we should take the above into
account. Given a prefix and its length, the reflected route will always
be the first one in the FIB alias list. However, if the route has a
non-zero TOS then its action will be converted to trap instead of
forward, since we currently don't support TOS-based routing. If this
turns out to be a real issue, we can add support for that using
policy-based switching.
The route's scope can be effectively ignored as any packet being routed
by the device would've been looked-up using the widest scope (UNIVERSE).
To achieve that we need to do two changes. Firstly, we need to create
another struct (FIB node) that will hold the list of FIB entries sharing
the same prefix and length. This struct will be hashed using these two
parameters.
Secondly, we need to change the route reflection to match the above
logic, so that the first FIB entry in the list will be programmed into
the device while the rest will remain in the driver's cache in case of
subsequent changes.
Signed-off-by: Ido Schimmel <idosch@mellanox.com>
Signed-off-by: Jiri Pirko <jiri@mellanox.com>
Signed-off-by: David S. Miller <davem@davemloft.net>
2017-02-09 17:28:42 +08:00
|
|
|
struct mlxsw_sp_fib_node *fib_node;
|
2017-03-10 15:53:41 +08:00
|
|
|
struct mlxsw_sp_fib *fib;
|
mlxsw: spectrum_router: Correctly handle identical routes
In the device, routes are indexed in a routing table based on the prefix
and its length. This is in contrast to the kernel's FIB where several
FIB aliases can exist with these parameters being identical. In such
cases, the routes will be sorted by table ID (LOCAL first, then MAIN),
TOS and finally priority (metric).
During lookup, these routes will be evaluated in order. In case the
packet's TOS field is non-zero and a FIB alias with a matching TOS is
found, then it's selected. Otherwise, the lookup defaults to the route
with TOS 0 (if it exists). However, if the requested scope is narrower
than the one found, then the lookup continues.
To best reflect the kernel's datapath we should take the above into
account. Given a prefix and its length, the reflected route will always
be the first one in the FIB alias list. However, if the route has a
non-zero TOS then its action will be converted to trap instead of
forward, since we currently don't support TOS-based routing. If this
turns out to be a real issue, we can add support for that using
policy-based switching.
The route's scope can be effectively ignored as any packet being routed
by the device would've been looked-up using the widest scope (UNIVERSE).
To achieve that we need to do two changes. Firstly, we need to create
another struct (FIB node) that will hold the list of FIB entries sharing
the same prefix and length. This struct will be hashed using these two
parameters.
Secondly, we need to change the route reflection to match the above
logic, so that the first FIB entry in the list will be programmed into
the device while the rest will remain in the driver's cache in case of
subsequent changes.
Signed-off-by: Ido Schimmel <idosch@mellanox.com>
Signed-off-by: Jiri Pirko <jiri@mellanox.com>
Signed-off-by: David S. Miller <davem@davemloft.net>
2017-02-09 17:28:42 +08:00
|
|
|
struct mlxsw_sp_vr *vr;
|
|
|
|
int err;
|
|
|
|
|
2017-10-19 00:56:56 +08:00
|
|
|
vr = mlxsw_sp_vr_get(mlxsw_sp, tb_id, NULL);
|
mlxsw: spectrum_router: Correctly handle identical routes
In the device, routes are indexed in a routing table based on the prefix
and its length. This is in contrast to the kernel's FIB where several
FIB aliases can exist with these parameters being identical. In such
cases, the routes will be sorted by table ID (LOCAL first, then MAIN),
TOS and finally priority (metric).
During lookup, these routes will be evaluated in order. In case the
packet's TOS field is non-zero and a FIB alias with a matching TOS is
found, then it's selected. Otherwise, the lookup defaults to the route
with TOS 0 (if it exists). However, if the requested scope is narrower
than the one found, then the lookup continues.
To best reflect the kernel's datapath we should take the above into
account. Given a prefix and its length, the reflected route will always
be the first one in the FIB alias list. However, if the route has a
non-zero TOS then its action will be converted to trap instead of
forward, since we currently don't support TOS-based routing. If this
turns out to be a real issue, we can add support for that using
policy-based switching.
The route's scope can be effectively ignored as any packet being routed
by the device would've been looked-up using the widest scope (UNIVERSE).
To achieve that we need to do two changes. Firstly, we need to create
another struct (FIB node) that will hold the list of FIB entries sharing
the same prefix and length. This struct will be hashed using these two
parameters.
Secondly, we need to change the route reflection to match the above
logic, so that the first FIB entry in the list will be programmed into
the device while the rest will remain in the driver's cache in case of
subsequent changes.
Signed-off-by: Ido Schimmel <idosch@mellanox.com>
Signed-off-by: Jiri Pirko <jiri@mellanox.com>
Signed-off-by: David S. Miller <davem@davemloft.net>
2017-02-09 17:28:42 +08:00
|
|
|
if (IS_ERR(vr))
|
|
|
|
return ERR_CAST(vr);
|
2017-07-18 16:10:21 +08:00
|
|
|
fib = mlxsw_sp_vr_fib(vr, proto);
|
mlxsw: spectrum_router: Correctly handle identical routes
In the device, routes are indexed in a routing table based on the prefix
and its length. This is in contrast to the kernel's FIB where several
FIB aliases can exist with these parameters being identical. In such
cases, the routes will be sorted by table ID (LOCAL first, then MAIN),
TOS and finally priority (metric).
During lookup, these routes will be evaluated in order. In case the
packet's TOS field is non-zero and a FIB alias with a matching TOS is
found, then it's selected. Otherwise, the lookup defaults to the route
with TOS 0 (if it exists). However, if the requested scope is narrower
than the one found, then the lookup continues.
To best reflect the kernel's datapath we should take the above into
account. Given a prefix and its length, the reflected route will always
be the first one in the FIB alias list. However, if the route has a
non-zero TOS then its action will be converted to trap instead of
forward, since we currently don't support TOS-based routing. If this
turns out to be a real issue, we can add support for that using
policy-based switching.
The route's scope can be effectively ignored as any packet being routed
by the device would've been looked-up using the widest scope (UNIVERSE).
To achieve that we need to do two changes. Firstly, we need to create
another struct (FIB node) that will hold the list of FIB entries sharing
the same prefix and length. This struct will be hashed using these two
parameters.
Secondly, we need to change the route reflection to match the above
logic, so that the first FIB entry in the list will be programmed into
the device while the rest will remain in the driver's cache in case of
subsequent changes.
Signed-off-by: Ido Schimmel <idosch@mellanox.com>
Signed-off-by: Jiri Pirko <jiri@mellanox.com>
Signed-off-by: David S. Miller <davem@davemloft.net>
2017-02-09 17:28:42 +08:00
|
|
|
|
2017-07-18 16:10:21 +08:00
|
|
|
fib_node = mlxsw_sp_fib_node_lookup(fib, addr, addr_len, prefix_len);
|
mlxsw: spectrum_router: Correctly handle identical routes
In the device, routes are indexed in a routing table based on the prefix
and its length. This is in contrast to the kernel's FIB where several
FIB aliases can exist with these parameters being identical. In such
cases, the routes will be sorted by table ID (LOCAL first, then MAIN),
TOS and finally priority (metric).
During lookup, these routes will be evaluated in order. In case the
packet's TOS field is non-zero and a FIB alias with a matching TOS is
found, then it's selected. Otherwise, the lookup defaults to the route
with TOS 0 (if it exists). However, if the requested scope is narrower
than the one found, then the lookup continues.
To best reflect the kernel's datapath we should take the above into
account. Given a prefix and its length, the reflected route will always
be the first one in the FIB alias list. However, if the route has a
non-zero TOS then its action will be converted to trap instead of
forward, since we currently don't support TOS-based routing. If this
turns out to be a real issue, we can add support for that using
policy-based switching.
The route's scope can be effectively ignored as any packet being routed
by the device would've been looked-up using the widest scope (UNIVERSE).
To achieve that we need to do two changes. Firstly, we need to create
another struct (FIB node) that will hold the list of FIB entries sharing
the same prefix and length. This struct will be hashed using these two
parameters.
Secondly, we need to change the route reflection to match the above
logic, so that the first FIB entry in the list will be programmed into
the device while the rest will remain in the driver's cache in case of
subsequent changes.
Signed-off-by: Ido Schimmel <idosch@mellanox.com>
Signed-off-by: Jiri Pirko <jiri@mellanox.com>
Signed-off-by: David S. Miller <davem@davemloft.net>
2017-02-09 17:28:42 +08:00
|
|
|
if (fib_node)
|
|
|
|
return fib_node;
|
2016-09-01 16:37:40 +08:00
|
|
|
|
2017-07-18 16:10:21 +08:00
|
|
|
fib_node = mlxsw_sp_fib_node_create(fib, addr, addr_len, prefix_len);
|
mlxsw: spectrum_router: Correctly handle identical routes
In the device, routes are indexed in a routing table based on the prefix
and its length. This is in contrast to the kernel's FIB where several
FIB aliases can exist with these parameters being identical. In such
cases, the routes will be sorted by table ID (LOCAL first, then MAIN),
TOS and finally priority (metric).
During lookup, these routes will be evaluated in order. In case the
packet's TOS field is non-zero and a FIB alias with a matching TOS is
found, then it's selected. Otherwise, the lookup defaults to the route
with TOS 0 (if it exists). However, if the requested scope is narrower
than the one found, then the lookup continues.
To best reflect the kernel's datapath we should take the above into
account. Given a prefix and its length, the reflected route will always
be the first one in the FIB alias list. However, if the route has a
non-zero TOS then its action will be converted to trap instead of
forward, since we currently don't support TOS-based routing. If this
turns out to be a real issue, we can add support for that using
policy-based switching.
The route's scope can be effectively ignored as any packet being routed
by the device would've been looked-up using the widest scope (UNIVERSE).
To achieve that we need to do two changes. Firstly, we need to create
another struct (FIB node) that will hold the list of FIB entries sharing
the same prefix and length. This struct will be hashed using these two
parameters.
Secondly, we need to change the route reflection to match the above
logic, so that the first FIB entry in the list will be programmed into
the device while the rest will remain in the driver's cache in case of
subsequent changes.
Signed-off-by: Ido Schimmel <idosch@mellanox.com>
Signed-off-by: Jiri Pirko <jiri@mellanox.com>
Signed-off-by: David S. Miller <davem@davemloft.net>
2017-02-09 17:28:42 +08:00
|
|
|
if (!fib_node) {
|
|
|
|
err = -ENOMEM;
|
|
|
|
goto err_fib_node_create;
|
2016-09-01 16:37:40 +08:00
|
|
|
}
|
mlxsw: spectrum_router: Correctly handle identical routes
In the device, routes are indexed in a routing table based on the prefix
and its length. This is in contrast to the kernel's FIB where several
FIB aliases can exist with these parameters being identical. In such
cases, the routes will be sorted by table ID (LOCAL first, then MAIN),
TOS and finally priority (metric).
During lookup, these routes will be evaluated in order. In case the
packet's TOS field is non-zero and a FIB alias with a matching TOS is
found, then it's selected. Otherwise, the lookup defaults to the route
with TOS 0 (if it exists). However, if the requested scope is narrower
than the one found, then the lookup continues.
To best reflect the kernel's datapath we should take the above into
account. Given a prefix and its length, the reflected route will always
be the first one in the FIB alias list. However, if the route has a
non-zero TOS then its action will be converted to trap instead of
forward, since we currently don't support TOS-based routing. If this
turns out to be a real issue, we can add support for that using
policy-based switching.
The route's scope can be effectively ignored as any packet being routed
by the device would've been looked-up using the widest scope (UNIVERSE).
To achieve that we need to do two changes. Firstly, we need to create
another struct (FIB node) that will hold the list of FIB entries sharing
the same prefix and length. This struct will be hashed using these two
parameters.
Secondly, we need to change the route reflection to match the above
logic, so that the first FIB entry in the list will be programmed into
the device while the rest will remain in the driver's cache in case of
subsequent changes.
Signed-off-by: Ido Schimmel <idosch@mellanox.com>
Signed-off-by: Jiri Pirko <jiri@mellanox.com>
Signed-off-by: David S. Miller <davem@davemloft.net>
2017-02-09 17:28:42 +08:00
|
|
|
|
2017-03-10 15:53:41 +08:00
|
|
|
err = mlxsw_sp_fib_node_init(mlxsw_sp, fib_node, fib);
|
|
|
|
if (err)
|
|
|
|
goto err_fib_node_init;
|
|
|
|
|
mlxsw: spectrum_router: Correctly handle identical routes
In the device, routes are indexed in a routing table based on the prefix
and its length. This is in contrast to the kernel's FIB where several
FIB aliases can exist with these parameters being identical. In such
cases, the routes will be sorted by table ID (LOCAL first, then MAIN),
TOS and finally priority (metric).
During lookup, these routes will be evaluated in order. In case the
packet's TOS field is non-zero and a FIB alias with a matching TOS is
found, then it's selected. Otherwise, the lookup defaults to the route
with TOS 0 (if it exists). However, if the requested scope is narrower
than the one found, then the lookup continues.
To best reflect the kernel's datapath we should take the above into
account. Given a prefix and its length, the reflected route will always
be the first one in the FIB alias list. However, if the route has a
non-zero TOS then its action will be converted to trap instead of
forward, since we currently don't support TOS-based routing. If this
turns out to be a real issue, we can add support for that using
policy-based switching.
The route's scope can be effectively ignored as any packet being routed
by the device would've been looked-up using the widest scope (UNIVERSE).
To achieve that we need to do two changes. Firstly, we need to create
another struct (FIB node) that will hold the list of FIB entries sharing
the same prefix and length. This struct will be hashed using these two
parameters.
Secondly, we need to change the route reflection to match the above
logic, so that the first FIB entry in the list will be programmed into
the device while the rest will remain in the driver's cache in case of
subsequent changes.
Signed-off-by: Ido Schimmel <idosch@mellanox.com>
Signed-off-by: Jiri Pirko <jiri@mellanox.com>
Signed-off-by: David S. Miller <davem@davemloft.net>
2017-02-09 17:28:42 +08:00
|
|
|
return fib_node;
|
|
|
|
|
2017-03-10 15:53:41 +08:00
|
|
|
err_fib_node_init:
|
|
|
|
mlxsw_sp_fib_node_destroy(fib_node);
|
mlxsw: spectrum_router: Correctly handle identical routes
In the device, routes are indexed in a routing table based on the prefix
and its length. This is in contrast to the kernel's FIB where several
FIB aliases can exist with these parameters being identical. In such
cases, the routes will be sorted by table ID (LOCAL first, then MAIN),
TOS and finally priority (metric).
During lookup, these routes will be evaluated in order. In case the
packet's TOS field is non-zero and a FIB alias with a matching TOS is
found, then it's selected. Otherwise, the lookup defaults to the route
with TOS 0 (if it exists). However, if the requested scope is narrower
than the one found, then the lookup continues.
To best reflect the kernel's datapath we should take the above into
account. Given a prefix and its length, the reflected route will always
be the first one in the FIB alias list. However, if the route has a
non-zero TOS then its action will be converted to trap instead of
forward, since we currently don't support TOS-based routing. If this
turns out to be a real issue, we can add support for that using
policy-based switching.
The route's scope can be effectively ignored as any packet being routed
by the device would've been looked-up using the widest scope (UNIVERSE).
To achieve that we need to do two changes. Firstly, we need to create
another struct (FIB node) that will hold the list of FIB entries sharing
the same prefix and length. This struct will be hashed using these two
parameters.
Secondly, we need to change the route reflection to match the above
logic, so that the first FIB entry in the list will be programmed into
the device while the rest will remain in the driver's cache in case of
subsequent changes.
Signed-off-by: Ido Schimmel <idosch@mellanox.com>
Signed-off-by: Jiri Pirko <jiri@mellanox.com>
Signed-off-by: David S. Miller <davem@davemloft.net>
2017-02-09 17:28:42 +08:00
|
|
|
err_fib_node_create:
|
2018-01-22 16:17:42 +08:00
|
|
|
mlxsw_sp_vr_put(mlxsw_sp, vr);
|
mlxsw: spectrum_router: Correctly handle identical routes
In the device, routes are indexed in a routing table based on the prefix
and its length. This is in contrast to the kernel's FIB where several
FIB aliases can exist with these parameters being identical. In such
cases, the routes will be sorted by table ID (LOCAL first, then MAIN),
TOS and finally priority (metric).
During lookup, these routes will be evaluated in order. In case the
packet's TOS field is non-zero and a FIB alias with a matching TOS is
found, then it's selected. Otherwise, the lookup defaults to the route
with TOS 0 (if it exists). However, if the requested scope is narrower
than the one found, then the lookup continues.
To best reflect the kernel's datapath we should take the above into
account. Given a prefix and its length, the reflected route will always
be the first one in the FIB alias list. However, if the route has a
non-zero TOS then its action will be converted to trap instead of
forward, since we currently don't support TOS-based routing. If this
turns out to be a real issue, we can add support for that using
policy-based switching.
The route's scope can be effectively ignored as any packet being routed
by the device would've been looked-up using the widest scope (UNIVERSE).
To achieve that we need to do two changes. Firstly, we need to create
another struct (FIB node) that will hold the list of FIB entries sharing
the same prefix and length. This struct will be hashed using these two
parameters.
Secondly, we need to change the route reflection to match the above
logic, so that the first FIB entry in the list will be programmed into
the device while the rest will remain in the driver's cache in case of
subsequent changes.
Signed-off-by: Ido Schimmel <idosch@mellanox.com>
Signed-off-by: Jiri Pirko <jiri@mellanox.com>
Signed-off-by: David S. Miller <davem@davemloft.net>
2017-02-09 17:28:42 +08:00
|
|
|
return ERR_PTR(err);
|
2016-09-01 16:37:40 +08:00
|
|
|
}
|
|
|
|
|
2017-07-18 16:10:21 +08:00
|
|
|
/*
 * Release a FIB node once it no longer has a FIB entry linked to it.
 *
 * If fib_node->fib_entry is still set, the node is left untouched and the
 * function returns immediately. Otherwise the node is finalized with
 * mlxsw_sp_fib_node_fini(), destroyed with mlxsw_sp_fib_node_destroy(), and
 * mlxsw_sp_vr_put() is called on the virtual router the node belonged to.
 *
 * NOTE(review): the mlxsw_sp_vr_put() call presumably balances the
 * mlxsw_sp_vr_get() done when the node is looked up or created - confirm
 * against the caller.
 */
static void mlxsw_sp_fib_node_put(struct mlxsw_sp *mlxsw_sp,
|
|
|
|
struct mlxsw_sp_fib_node *fib_node)
|
2016-09-01 16:37:40 +08:00
|
|
|
{
|
2017-03-10 15:53:41 +08:00
|
|
|
/* Read the VR pointer up front: fib_node is destroyed before the VR is put. */
struct mlxsw_sp_vr *vr = fib_node->fib->vr;
|
2016-09-01 16:37:40 +08:00
|
|
|
|
2019-12-27 00:41:17 +08:00
|
|
|
/* A node that still has an entry linked is kept as is. */
if (fib_node->fib_entry)
|
mlxsw: spectrum_router: Correctly handle identical routes
In the device, routes are indexed in a routing table based on the prefix
and its length. This is in contrast to the kernel's FIB where several
FIB aliases can exist with these parameters being identical. In such
cases, the routes will be sorted by table ID (LOCAL first, then MAIN),
TOS and finally priority (metric).
During lookup, these routes will be evaluated in order. In case the
packet's TOS field is non-zero and a FIB alias with a matching TOS is
found, then it's selected. Otherwise, the lookup defaults to the route
with TOS 0 (if it exists). However, if the requested scope is narrower
than the one found, then the lookup continues.
To best reflect the kernel's datapath we should take the above into
account. Given a prefix and its length, the reflected route will always
be the first one in the FIB alias list. However, if the route has a
non-zero TOS then its action will be converted to trap instead of
forward, since we currently don't support TOS-based routing. If this
turns out to be a real issue, we can add support for that using
policy-based switching.
The route's scope can be effectively ignored as any packet being routed
by the device would've been looked-up using the widest scope (UNIVERSE).
To achieve that we need to do two changes. Firstly, we need to create
another struct (FIB node) that will hold the list of FIB entries sharing
the same prefix and length. This struct will be hashed using these two
parameters.
Secondly, we need to change the route reflection to match the above
logic, so that the first FIB entry in the list will be programmed into
the device while the rest will remain in the driver's cache in case of
subsequent changes.
Signed-off-by: Ido Schimmel <idosch@mellanox.com>
Signed-off-by: Jiri Pirko <jiri@mellanox.com>
Signed-off-by: David S. Miller <davem@davemloft.net>
2017-02-09 17:28:42 +08:00
|
|
|
return;
|
2017-03-10 15:53:41 +08:00
|
|
|
mlxsw_sp_fib_node_fini(mlxsw_sp, fib_node);
|
mlxsw: spectrum_router: Correctly handle identical routes
In the device, routes are indexed in a routing table based on the prefix
and its length. This is in contrast to the kernel's FIB where several
FIB aliases can exist with these parameters being identical. In such
cases, the routes will be sorted by table ID (LOCAL first, then MAIN),
TOS and finally priority (metric).
During lookup, these routes will be evaluated in order. In case the
packet's TOS field is non-zero and a FIB alias with a matching TOS is
found, then it's selected. Otherwise, the lookup defaults to the route
with TOS 0 (if it exists). However, if the requested scope is narrower
than the one found, then the lookup continues.
To best reflect the kernel's datapath we should take the above into
account. Given a prefix and its length, the reflected route will always
be the first one in the FIB alias list. However, if the route has a
non-zero TOS then its action will be converted to trap instead of
forward, since we currently don't support TOS-based routing. If this
turns out to be a real issue, we can add support for that using
policy-based switching.
The route's scope can be effectively ignored as any packet being routed
by the device would've been looked-up using the widest scope (UNIVERSE).
To achieve that we need to do two changes. Firstly, we need to create
another struct (FIB node) that will hold the list of FIB entries sharing
the same prefix and length. This struct will be hashed using these two
parameters.
Secondly, we need to change the route reflection to match the above
logic, so that the first FIB entry in the list will be programmed into
the device while the rest will remain in the driver's cache in case of
subsequent changes.
Signed-off-by: Ido Schimmel <idosch@mellanox.com>
Signed-off-by: Jiri Pirko <jiri@mellanox.com>
Signed-off-by: David S. Miller <davem@davemloft.net>
2017-02-09 17:28:42 +08:00
|
|
|
mlxsw_sp_fib_node_destroy(fib_node);
|
2018-01-22 16:17:42 +08:00
|
|
|
mlxsw_sp_vr_put(mlxsw_sp, vr);
|
2016-07-04 14:23:11 +08:00
|
|
|
}
|
|
|
|
|
2019-12-27 00:41:16 +08:00
|
|
|
/*
 * Link a FIB entry to its FIB node and push it to the device.
 *
 * The node is taken from fib_entry->fib_node. Its fib_entry pointer is set
 * to the new entry before mlxsw_sp_fib_entry_update() is called, and is
 * reset to NULL again if that update fails, so a failed link leaves the
 * node without an entry.
 *
 * Returns 0 on success, or the error code returned by
 * mlxsw_sp_fib_entry_update().
 */
static int mlxsw_sp_fib_node_entry_link(struct mlxsw_sp *mlxsw_sp,
|
|
|
|
struct mlxsw_sp_fib_entry *fib_entry)
|
mlxsw: spectrum_router: Correctly handle identical routes
In the device, routes are indexed in a routing table based on the prefix
and its length. This is in contrast to the kernel's FIB where several
FIB aliases can exist with these parameters being identical. In such
cases, the routes will be sorted by table ID (LOCAL first, then MAIN),
TOS and finally priority (metric).
During lookup, these routes will be evaluated in order. In case the
packet's TOS field is non-zero and a FIB alias with a matching TOS is
found, then it's selected. Otherwise, the lookup defaults to the route
with TOS 0 (if it exists). However, if the requested scope is narrower
than the one found, then the lookup continues.
To best reflect the kernel's datapath we should take the above into
account. Given a prefix and its length, the reflected route will always
be the first one in the FIB alias list. However, if the route has a
non-zero TOS then its action will be converted to trap instead of
forward, since we currently don't support TOS-based routing. If this
turns out to be a real issue, we can add support for that using
policy-based switching.
The route's scope can be effectively ignored as any packet being routed
by the device would've been looked-up using the widest scope (UNIVERSE).
To achieve that we need to do two changes. Firstly, we need to create
another struct (FIB node) that will hold the list of FIB entries sharing
the same prefix and length. This struct will be hashed using these two
parameters.
Secondly, we need to change the route reflection to match the above
logic, so that the first FIB entry in the list will be programmed into
the device while the rest will remain in the driver's cache in case of
subsequent changes.
Signed-off-by: Ido Schimmel <idosch@mellanox.com>
Signed-off-by: Jiri Pirko <jiri@mellanox.com>
Signed-off-by: David S. Miller <davem@davemloft.net>
2017-02-09 17:28:42 +08:00
|
|
|
{
|
2019-12-27 00:41:16 +08:00
|
|
|
struct mlxsw_sp_fib_node *fib_node = fib_entry->fib_node;
|
mlxsw: spectrum_router: Correctly handle identical routes
In the device, routes are indexed in a routing table based on the prefix
and its length. This is in contrast to the kernel's FIB where several
FIB aliases can exist with these parameters being identical. In such
cases, the routes will be sorted by table ID (LOCAL first, then MAIN),
TOS and finally priority (metric).
During lookup, these routes will be evaluated in order. In case the
packet's TOS field is non-zero and a FIB alias with a matching TOS is
found, then it's selected. Otherwise, the lookup defaults to the route
with TOS 0 (if it exists). However, if the requested scope is narrower
than the one found, then the lookup continues.
To best reflect the kernel's datapath we should take the above into
account. Given a prefix and its length, the reflected route will always
be the first one in the FIB alias list. However, if the route has a
non-zero TOS then its action will be converted to trap instead of
forward, since we currently don't support TOS-based routing. If this
turns out to be a real issue, we can add support for that using
policy-based switching.
The route's scope can be effectively ignored as any packet being routed
by the device would've been looked-up using the widest scope (UNIVERSE).
To achieve that we need to do two changes. Firstly, we need to create
another struct (FIB node) that will hold the list of FIB entries sharing
the same prefix and length. This struct will be hashed using these two
parameters.
Secondly, we need to change the route reflection to match the above
logic, so that the first FIB entry in the list will be programmed into
the device while the rest will remain in the driver's cache in case of
subsequent changes.
Signed-off-by: Ido Schimmel <idosch@mellanox.com>
Signed-off-by: Jiri Pirko <jiri@mellanox.com>
Signed-off-by: David S. Miller <davem@davemloft.net>
2017-02-09 17:28:42 +08:00
|
|
|
int err;
|
|
|
|
|
2019-12-27 00:41:17 +08:00
|
|
|
fib_node->fib_entry = fib_entry;
|
mlxsw: spectrum_router: Correctly handle identical routes
In the device, routes are indexed in a routing table based on the prefix
and its length. This is in contrast to the kernel's FIB where several
FIB aliases can exist with these parameters being identical. In such
cases, the routes will be sorted by table ID (LOCAL first, then MAIN),
TOS and finally priority (metric).
During lookup, these routes will be evaluated in order. In case the
packet's TOS field is non-zero and a FIB alias with a matching TOS is
found, then it's selected. Otherwise, the lookup defaults to the route
with TOS 0 (if it exists). However, if the requested scope is narrower
than the one found, then the lookup continues.
To best reflect the kernel's datapath we should take the above into
account. Given a prefix and its length, the reflected route will always
be the first one in the FIB alias list. However, if the route has a
non-zero TOS then its action will be converted to trap instead of
forward, since we currently don't support TOS-based routing. If this
turns out to be a real issue, we can add support for that using
policy-based switching.
The route's scope can be effectively ignored as any packet being routed
by the device would've been looked-up using the widest scope (UNIVERSE).
To achieve that we need to do two changes. Firstly, we need to create
another struct (FIB node) that will hold the list of FIB entries sharing
the same prefix and length. This struct will be hashed using these two
parameters.
Secondly, we need to change the route reflection to match the above
logic, so that the first FIB entry in the list will be programmed into
the device while the rest will remain in the driver's cache in case of
subsequent changes.
Signed-off-by: Ido Schimmel <idosch@mellanox.com>
Signed-off-by: Jiri Pirko <jiri@mellanox.com>
Signed-off-by: David S. Miller <davem@davemloft.net>
2017-02-09 17:28:42 +08:00
|
|
|
|
2019-12-27 00:41:17 +08:00
|
|
|
err = mlxsw_sp_fib_entry_update(mlxsw_sp, fib_entry);
|
mlxsw: spectrum_router: Correctly handle identical routes
In the device, routes are indexed in a routing table based on the prefix
and its length. This is in contrast to the kernel's FIB where several
FIB aliases can exist with these parameters being identical. In such
cases, the routes will be sorted by table ID (LOCAL first, then MAIN),
TOS and finally priority (metric).
During lookup, these routes will be evaluated in order. In case the
packet's TOS field is non-zero and a FIB alias with a matching TOS is
found, then it's selected. Otherwise, the lookup defaults to the route
with TOS 0 (if it exists). However, if the requested scope is narrower
than the one found, then the lookup continues.
To best reflect the kernel's datapath we should take the above into
account. Given a prefix and its length, the reflected route will always
be the first one in the FIB alias list. However, if the route has a
non-zero TOS then its action will be converted to trap instead of
forward, since we currently don't support TOS-based routing. If this
turns out to be a real issue, we can add support for that using
policy-based switching.
The route's scope can be effectively ignored as any packet being routed
by the device would've been looked-up using the widest scope (UNIVERSE).
To achieve that we need to do two changes. Firstly, we need to create
another struct (FIB node) that will hold the list of FIB entries sharing
the same prefix and length. This struct will be hashed using these two
parameters.
Secondly, we need to change the route reflection to match the above
logic, so that the first FIB entry in the list will be programmed into
the device while the rest will remain in the driver's cache in case of
subsequent changes.
Signed-off-by: Ido Schimmel <idosch@mellanox.com>
Signed-off-by: Jiri Pirko <jiri@mellanox.com>
Signed-off-by: David S. Miller <davem@davemloft.net>
2017-02-09 17:28:42 +08:00
|
|
|
if (err)
|
2019-12-27 00:41:17 +08:00
|
|
|
goto err_fib_entry_update;
|
mlxsw: spectrum_router: Correctly handle identical routes
In the device, routes are indexed in a routing table based on the prefix
and its length. This is in contrast to the kernel's FIB where several
FIB aliases can exist with these parameters being identical. In such
cases, the routes will be sorted by table ID (LOCAL first, then MAIN),
TOS and finally priority (metric).
During lookup, these routes will be evaluated in order. In case the
packet's TOS field is non-zero and a FIB alias with a matching TOS is
found, then it's selected. Otherwise, the lookup defaults to the route
with TOS 0 (if it exists). However, if the requested scope is narrower
than the one found, then the lookup continues.
To best reflect the kernel's datapath we should take the above into
account. Given a prefix and its length, the reflected route will always
be the first one in the FIB alias list. However, if the route has a
non-zero TOS then its action will be converted to trap instead of
forward, since we currently don't support TOS-based routing. If this
turns out to be a real issue, we can add support for that using
policy-based switching.
The route's scope can be effectively ignored as any packet being routed
by the device would've been looked-up using the widest scope (UNIVERSE).
To achieve that we need to do two changes. Firstly, we need to create
another struct (FIB node) that will hold the list of FIB entries sharing
the same prefix and length. This struct will be hashed using these two
parameters.
Secondly, we need to change the route reflection to match the above
logic, so that the first FIB entry in the list will be programmed into
the device while the rest will remain in the driver's cache in case of
subsequent changes.
Signed-off-by: Ido Schimmel <idosch@mellanox.com>
Signed-off-by: Jiri Pirko <jiri@mellanox.com>
Signed-off-by: David S. Miller <davem@davemloft.net>
2017-02-09 17:28:42 +08:00
|
|
|
|
|
|
|
return 0;
|
|
|
|
|
2019-12-27 00:41:17 +08:00
|
|
|
err_fib_entry_update:
|
|
|
|
fib_node->fib_entry = NULL;
|
mlxsw: spectrum_router: Correctly handle identical routes
In the device, routes are indexed in a routing table based on the prefix
and its length. This is in contrast to the kernel's FIB where several
FIB aliases can exist with these parameters being identical. In such
cases, the routes will be sorted by table ID (LOCAL first, then MAIN),
TOS and finally priority (metric).
During lookup, these routes will be evaluated in order. In case the
packet's TOS field is non-zero and a FIB alias with a matching TOS is
found, then it's selected. Otherwise, the lookup defaults to the route
with TOS 0 (if it exists). However, if the requested scope is narrower
than the one found, then the lookup continues.
To best reflect the kernel's datapath we should take the above into
account. Given a prefix and its length, the reflected route will always
be the first one in the FIB alias list. However, if the route has a
non-zero TOS then its action will be converted to trap instead of
forward, since we currently don't support TOS-based routing. If this
turns out to be a real issue, we can add support for that using
policy-based switching.
The route's scope can be effectively ignored as any packet being routed
by the device would've been looked-up using the widest scope (UNIVERSE).
To achieve that we need to do two changes. Firstly, we need to create
another struct (FIB node) that will hold the list of FIB entries sharing
the same prefix and length. This struct will be hashed using these two
parameters.
Secondly, we need to change the route reflection to match the above
logic, so that the first FIB entry in the list will be programmed into
the device while the rest will remain in the driver's cache in case of
subsequent changes.
Signed-off-by: Ido Schimmel <idosch@mellanox.com>
Signed-off-by: Jiri Pirko <jiri@mellanox.com>
Signed-off-by: David S. Miller <davem@davemloft.net>
2017-02-09 17:28:42 +08:00
|
|
|
return err;
|
|
|
|
}
|
|
|
|
|
|
|
|
static void
|
2019-12-27 00:41:16 +08:00
|
|
|
mlxsw_sp_fib_node_entry_unlink(struct mlxsw_sp *mlxsw_sp,
|
|
|
|
struct mlxsw_sp_fib_entry *fib_entry)
|
mlxsw: spectrum_router: Correctly handle identical routes
In the device, routes are indexed in a routing table based on the prefix
and its length. This is in contrast to the kernel's FIB where several
FIB aliases can exist with these parameters being identical. In such
cases, the routes will be sorted by table ID (LOCAL first, then MAIN),
TOS and finally priority (metric).
During lookup, these routes will be evaluated in order. In case the
packet's TOS field is non-zero and a FIB alias with a matching TOS is
found, then it's selected. Otherwise, the lookup defaults to the route
with TOS 0 (if it exists). However, if the requested scope is narrower
than the one found, then the lookup continues.
To best reflect the kernel's datapath we should take the above into
account. Given a prefix and its length, the reflected route will always
be the first one in the FIB alias list. However, if the route has a
non-zero TOS then its action will be converted to trap instead of
forward, since we currently don't support TOS-based routing. If this
turns out to be a real issue, we can add support for that using
policy-based switching.
The route's scope can be effectively ignored as any packet being routed
by the device would've been looked-up using the widest scope (UNIVERSE).
To achieve that we need to do two changes. Firstly, we need to create
another struct (FIB node) that will hold the list of FIB entries sharing
the same prefix and length. This struct will be hashed using these two
parameters.
Secondly, we need to change the route reflection to match the above
logic, so that the first FIB entry in the list will be programmed into
the device while the rest will remain in the driver's cache in case of
subsequent changes.
Signed-off-by: Ido Schimmel <idosch@mellanox.com>
Signed-off-by: Jiri Pirko <jiri@mellanox.com>
Signed-off-by: David S. Miller <davem@davemloft.net>
2017-02-09 17:28:42 +08:00
|
|
|
{
|
2019-12-27 00:41:17 +08:00
|
|
|
struct mlxsw_sp_fib_node *fib_node = fib_entry->fib_node;
|
2017-02-09 17:28:44 +08:00
|
|
|
|
2019-12-27 00:41:17 +08:00
|
|
|
mlxsw_sp_fib_entry_del(mlxsw_sp, fib_entry);
|
|
|
|
fib_node->fib_entry = NULL;
|
2017-02-09 17:28:44 +08:00
|
|
|
}
|
|
|
|
|
2020-02-08 01:26:24 +08:00
|
|
|
static bool mlxsw_sp_fib4_allow_replace(struct mlxsw_sp_fib4_entry *fib4_entry)
|
|
|
|
{
|
|
|
|
struct mlxsw_sp_fib_node *fib_node = fib4_entry->common.fib_node;
|
|
|
|
struct mlxsw_sp_fib4_entry *fib4_replaced;
|
|
|
|
|
|
|
|
if (!fib_node->fib_entry)
|
|
|
|
return true;
|
|
|
|
|
|
|
|
fib4_replaced = container_of(fib_node->fib_entry,
|
|
|
|
struct mlxsw_sp_fib4_entry, common);
|
|
|
|
if (fib4_entry->tb_id == RT_TABLE_MAIN &&
|
|
|
|
fib4_replaced->tb_id == RT_TABLE_LOCAL)
|
|
|
|
return false;
|
|
|
|
|
|
|
|
return true;
|
|
|
|
}
|
|
|
|
|
mlxsw: spectrum_router: Correctly handle identical routes
In the device, routes are indexed in a routing table based on the prefix
and its length. This is in contrast to the kernel's FIB where several
FIB aliases can exist with these parameters being identical. In such
cases, the routes will be sorted by table ID (LOCAL first, then MAIN),
TOS and finally priority (metric).
During lookup, these routes will be evaluated in order. In case the
packet's TOS field is non-zero and a FIB alias with a matching TOS is
found, then it's selected. Otherwise, the lookup defaults to the route
with TOS 0 (if it exists). However, if the requested scope is narrower
than the one found, then the lookup continues.
To best reflect the kernel's datapath we should take the above into
account. Given a prefix and its length, the reflected route will always
be the first one in the FIB alias list. However, if the route has a
non-zero TOS then its action will be converted to trap instead of
forward, since we currently don't support TOS-based routing. If this
turns out to be a real issue, we can add support for that using
policy-based switching.
The route's scope can be effectively ignored as any packet being routed
by the device would've been looked-up using the widest scope (UNIVERSE).
To achieve that we need to do two changes. Firstly, we need to create
another struct (FIB node) that will hold the list of FIB entries sharing
the same prefix and length. This struct will be hashed using these two
parameters.
Secondly, we need to change the route reflection to match the above
logic, so that the first FIB entry in the list will be programmed into
the device while the rest will remain in the driver's cache in case of
subsequent changes.
Signed-off-by: Ido Schimmel <idosch@mellanox.com>
Signed-off-by: Jiri Pirko <jiri@mellanox.com>
Signed-off-by: David S. Miller <davem@davemloft.net>
2017-02-09 17:28:42 +08:00
|
|
|
static int
|
2019-12-14 23:53:14 +08:00
|
|
|
mlxsw_sp_router_fib4_replace(struct mlxsw_sp *mlxsw_sp,
|
|
|
|
const struct fib_entry_notifier_info *fen_info)
|
mlxsw: spectrum_router: Correctly handle identical routes
In the device, routes are indexed in a routing table based on the prefix
and its length. This is in contrast to the kernel's FIB where several
FIB aliases can exist with these parameters being identical. In such
cases, the routes will be sorted by table ID (LOCAL first, then MAIN),
TOS and finally priority (metric).
During lookup, these routes will be evaluated in order. In case the
packet's TOS field is non-zero and a FIB alias with a matching TOS is
found, then it's selected. Otherwise, the lookup defaults to the route
with TOS 0 (if it exists). However, if the requested scope is narrower
than the one found, then the lookup continues.
To best reflect the kernel's datapath we should take the above into
account. Given a prefix and its length, the reflected route will always
be the first one in the FIB alias list. However, if the route has a
non-zero TOS then its action will be converted to trap instead of
forward, since we currently don't support TOS-based routing. If this
turns out to be a real issue, we can add support for that using
policy-based switching.
The route's scope can be effectively ignored as any packet being routed
by the device would've been looked-up using the widest scope (UNIVERSE).
To achieve that we need to do two changes. Firstly, we need to create
another struct (FIB node) that will hold the list of FIB entries sharing
the same prefix and length. This struct will be hashed using these two
parameters.
Secondly, we need to change the route reflection to match the above
logic, so that the first FIB entry in the list will be programmed into
the device while the rest will remain in the driver's cache in case of
subsequent changes.
Signed-off-by: Ido Schimmel <idosch@mellanox.com>
Signed-off-by: Jiri Pirko <jiri@mellanox.com>
Signed-off-by: David S. Miller <davem@davemloft.net>
2017-02-09 17:28:42 +08:00
|
|
|
{
|
2019-12-27 00:41:17 +08:00
|
|
|
struct mlxsw_sp_fib4_entry *fib4_entry, *fib4_replaced;
|
|
|
|
struct mlxsw_sp_fib_entry *replaced;
|
mlxsw: spectrum_router: Correctly handle identical routes
In the device, routes are indexed in a routing table based on the prefix
and its length. This is in contrast to the kernel's FIB where several
FIB aliases can exist with these parameters being identical. In such
cases, the routes will be sorted by table ID (LOCAL first, then MAIN),
TOS and finally priority (metric).
During lookup, these routes will be evaluated in order. In case the
packet's TOS field is non-zero and a FIB alias with a matching TOS is
found, then it's selected. Otherwise, the lookup defaults to the route
with TOS 0 (if it exists). However, if the requested scope is narrower
than the one found, then the lookup continues.
To best reflect the kernel's datapath we should take the above into
account. Given a prefix and its length, the reflected route will always
be the first one in the FIB alias list. However, if the route has a
non-zero TOS then its action will be converted to trap instead of
forward, since we currently don't support TOS-based routing. If this
turns out to be a real issue, we can add support for that using
policy-based switching.
The route's scope can be effectively ignored as any packet being routed
by the device would've been looked-up using the widest scope (UNIVERSE).
To achieve that we need to do two changes. Firstly, we need to create
another struct (FIB node) that will hold the list of FIB entries sharing
the same prefix and length. This struct will be hashed using these two
parameters.
Secondly, we need to change the route reflection to match the above
logic, so that the first FIB entry in the list will be programmed into
the device while the rest will remain in the driver's cache in case of
subsequent changes.
Signed-off-by: Ido Schimmel <idosch@mellanox.com>
Signed-off-by: Jiri Pirko <jiri@mellanox.com>
Signed-off-by: David S. Miller <davem@davemloft.net>
2017-02-09 17:28:42 +08:00
|
|
|
struct mlxsw_sp_fib_node *fib_node;
|
2016-07-04 14:23:11 +08:00
|
|
|
int err;
|
|
|
|
|
2017-05-17 01:38:25 +08:00
|
|
|
if (mlxsw_sp->router->aborted)
|
2016-09-26 18:52:31 +08:00
|
|
|
return 0;
|
|
|
|
|
2017-07-18 16:10:21 +08:00
|
|
|
fib_node = mlxsw_sp_fib_node_get(mlxsw_sp, fen_info->tb_id,
|
|
|
|
&fen_info->dst, sizeof(fen_info->dst),
|
|
|
|
fen_info->dst_len,
|
|
|
|
MLXSW_SP_L3_PROTO_IPV4);
|
mlxsw: spectrum_router: Correctly handle identical routes
In the device, routes are indexed in a routing table based on the prefix
and its length. This is in contrast to the kernel's FIB where several
FIB aliases can exist with these parameters being identical. In such
cases, the routes will be sorted by table ID (LOCAL first, then MAIN),
TOS and finally priority (metric).
During lookup, these routes will be evaluated in order. In case the
packet's TOS field is non-zero and a FIB alias with a matching TOS is
found, then it's selected. Otherwise, the lookup defaults to the route
with TOS 0 (if it exists). However, if the requested scope is narrower
than the one found, then the lookup continues.
To best reflect the kernel's datapath we should take the above into
account. Given a prefix and its length, the reflected route will always
be the first one in the FIB alias list. However, if the route has a
non-zero TOS then its action will be converted to trap instead of
forward, since we currently don't support TOS-based routing. If this
turns out to be a real issue, we can add support for that using
policy-based switching.
The route's scope can be effectively ignored as any packet being routed
by the device would've been looked-up using the widest scope (UNIVERSE).
To achieve that we need to do two changes. Firstly, we need to create
another struct (FIB node) that will hold the list of FIB entries sharing
the same prefix and length. This struct will be hashed using these two
parameters.
Secondly, we need to change the route reflection to match the above
logic, so that the first FIB entry in the list will be programmed into
the device while the rest will remain in the driver's cache in case of
subsequent changes.
Signed-off-by: Ido Schimmel <idosch@mellanox.com>
Signed-off-by: Jiri Pirko <jiri@mellanox.com>
Signed-off-by: David S. Miller <davem@davemloft.net>
2017-02-09 17:28:42 +08:00
|
|
|
if (IS_ERR(fib_node)) {
|
|
|
|
dev_warn(mlxsw_sp->bus_info->dev, "Failed to get FIB node\n");
|
|
|
|
return PTR_ERR(fib_node);
|
2016-09-26 18:52:31 +08:00
|
|
|
}
|
2016-07-04 14:23:11 +08:00
|
|
|
|
2017-07-18 16:10:26 +08:00
|
|
|
fib4_entry = mlxsw_sp_fib4_entry_create(mlxsw_sp, fib_node, fen_info);
|
|
|
|
if (IS_ERR(fib4_entry)) {
|
mlxsw: spectrum_router: Correctly handle identical routes
In the device, routes are indexed in a routing table based on the prefix
and its length. This is in contrast to the kernel's FIB where several
FIB aliases can exist with these parameters being identical. In such
cases, the routes will be sorted by table ID (LOCAL first, then MAIN),
TOS and finally priority (metric).
During lookup, these routes will be evaluated in order. In case the
packet's TOS field is non-zero and a FIB alias with a matching TOS is
found, then it's selected. Otherwise, the lookup defaults to the route
with TOS 0 (if it exists). However, if the requested scope is narrower
than the one found, then the lookup continues.
To best reflect the kernel's datapath we should take the above into
account. Given a prefix and its length, the reflected route will always
be the first one in the FIB alias list. However, if the route has a
non-zero TOS then its action will be converted to trap instead of
forward, since we currently don't support TOS-based routing. If this
turns out to be a real issue, we can add support for that using
policy-based switching.
The route's scope can be effectively ignored as any packet being routed
by the device would've been looked-up using the widest scope (UNIVERSE).
To achieve that we need to do two changes. Firstly, we need to create
another struct (FIB node) that will hold the list of FIB entries sharing
the same prefix and length. This struct will be hashed using these two
parameters.
Secondly, we need to change the route reflection to match the above
logic, so that the first FIB entry in the list will be programmed into
the device while the rest will remain in the driver's cache in case of
subsequent changes.
Signed-off-by: Ido Schimmel <idosch@mellanox.com>
Signed-off-by: Jiri Pirko <jiri@mellanox.com>
Signed-off-by: David S. Miller <davem@davemloft.net>
2017-02-09 17:28:42 +08:00
|
|
|
dev_warn(mlxsw_sp->bus_info->dev, "Failed to create FIB entry\n");
|
2017-07-18 16:10:26 +08:00
|
|
|
err = PTR_ERR(fib4_entry);
|
mlxsw: spectrum_router: Correctly handle identical routes
In the device, routes are indexed in a routing table based on the prefix
and its length. This is in contrast to the kernel's FIB where several
FIB aliases can exist with these parameters being identical. In such
cases, the routes will be sorted by table ID (LOCAL first, then MAIN),
TOS and finally priority (metric).
During lookup, these routes will be evaluated in order. In case the
packet's TOS field is non-zero and a FIB alias with a matching TOS is
found, then it's selected. Otherwise, the lookup defaults to the route
with TOS 0 (if it exists). However, if the requested scope is narrower
than the one found, then the lookup continues.
To best reflect the kernel's datapath we should take the above into
account. Given a prefix and its length, the reflected route will always
be the first one in the FIB alias list. However, if the route has a
non-zero TOS then its action will be converted to trap instead of
forward, since we currently don't support TOS-based routing. If this
turns out to be a real issue, we can add support for that using
policy-based switching.
The route's scope can be effectively ignored as any packet being routed
by the device would've been looked-up using the widest scope (UNIVERSE).
To achieve that we need to do two changes. Firstly, we need to create
another struct (FIB node) that will hold the list of FIB entries sharing
the same prefix and length. This struct will be hashed using these two
parameters.
Secondly, we need to change the route reflection to match the above
logic, so that the first FIB entry in the list will be programmed into
the device while the rest will remain in the driver's cache in case of
subsequent changes.
Signed-off-by: Ido Schimmel <idosch@mellanox.com>
Signed-off-by: Jiri Pirko <jiri@mellanox.com>
Signed-off-by: David S. Miller <davem@davemloft.net>
2017-02-09 17:28:42 +08:00
|
|
|
goto err_fib4_entry_create;
|
|
|
|
}
|
2016-09-01 16:37:40 +08:00
|
|
|
|
2020-02-08 01:26:24 +08:00
|
|
|
if (!mlxsw_sp_fib4_allow_replace(fib4_entry)) {
|
|
|
|
mlxsw_sp_fib4_entry_destroy(mlxsw_sp, fib4_entry);
|
|
|
|
mlxsw_sp_fib_node_put(mlxsw_sp, fib_node);
|
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
2019-12-27 00:41:17 +08:00
|
|
|
replaced = fib_node->fib_entry;
|
2019-12-27 00:41:16 +08:00
|
|
|
err = mlxsw_sp_fib_node_entry_link(mlxsw_sp, &fib4_entry->common);
|
2016-09-26 18:52:31 +08:00
|
|
|
if (err) {
|
mlxsw: spectrum_router: Correctly handle identical routes
In the device, routes are indexed in a routing table based on the prefix
and its length. This is in contrast to the kernel's FIB where several
FIB aliases can exist with these parameters being identical. In such
cases, the routes will be sorted by table ID (LOCAL first, then MAIN),
TOS and finally priority (metric).
During lookup, these routes will be evaluated in order. In case the
packet's TOS field is non-zero and a FIB alias with a matching TOS is
found, then it's selected. Otherwise, the lookup defaults to the route
with TOS 0 (if it exists). However, if the requested scope is narrower
than the one found, then the lookup continues.
To best reflect the kernel's datapath we should take the above into
account. Given a prefix and its length, the reflected route will always
be the first one in the FIB alias list. However, if the route has a
non-zero TOS then its action will be converted to trap instead of
forward, since we currently don't support TOS-based routing. If this
turns out to be a real issue, we can add support for that using
policy-based switching.
The route's scope can be effectively ignored as any packet being routed
by the device would've been looked-up using the widest scope (UNIVERSE).
To achieve that we need to do two changes. Firstly, we need to create
another struct (FIB node) that will hold the list of FIB entries sharing
the same prefix and length. This struct will be hashed using these two
parameters.
Secondly, we need to change the route reflection to match the above
logic, so that the first FIB entry in the list will be programmed into
the device while the rest will remain in the driver's cache in case of
subsequent changes.
Signed-off-by: Ido Schimmel <idosch@mellanox.com>
Signed-off-by: Jiri Pirko <jiri@mellanox.com>
Signed-off-by: David S. Miller <davem@davemloft.net>
2017-02-09 17:28:42 +08:00
|
|
|
dev_warn(mlxsw_sp->bus_info->dev, "Failed to link FIB entry to node\n");
|
2019-12-27 00:41:16 +08:00
|
|
|
goto err_fib_node_entry_link;
|
2016-09-26 18:52:31 +08:00
|
|
|
}
|
mlxsw: spectrum_router: Correctly handle identical routes
In the device, routes are indexed in a routing table based on the prefix
and its length. This is in contrast to the kernel's FIB where several
FIB aliases can exist with these parameters being identical. In such
cases, the routes will be sorted by table ID (LOCAL first, then MAIN),
TOS and finally priority (metric).
During lookup, these routes will be evaluated in order. In case the
packet's TOS field is non-zero and a FIB alias with a matching TOS is
found, then it's selected. Otherwise, the lookup defaults to the route
with TOS 0 (if it exists). However, if the requested scope is narrower
than the one found, then the lookup continues.
To best reflect the kernel's datapath we should take the above into
account. Given a prefix and its length, the reflected route will always
be the first one in the FIB alias list. However, if the route has a
non-zero TOS then its action will be converted to trap instead of
forward, since we currently don't support TOS-based routing. If this
turns out to be a real issue, we can add support for that using
policy-based switching.
The route's scope can be effectively ignored as any packet being routed
by the device would've been looked-up using the widest scope (UNIVERSE).
To achieve that we need to do two changes. Firstly, we need to create
another struct (FIB node) that will hold the list of FIB entries sharing
the same prefix and length. This struct will be hashed using these two
parameters.
Secondly, we need to change the route reflection to match the above
logic, so that the first FIB entry in the list will be programmed into
the device while the rest will remain in the driver's cache in case of
subsequent changes.
Signed-off-by: Ido Schimmel <idosch@mellanox.com>
Signed-off-by: Jiri Pirko <jiri@mellanox.com>
Signed-off-by: David S. Miller <davem@davemloft.net>
2017-02-09 17:28:42 +08:00
|
|
|
|
2019-12-27 00:41:17 +08:00
|
|
|
/* Nothing to replace */
|
|
|
|
if (!replaced)
|
|
|
|
return 0;
|
|
|
|
|
2020-01-14 19:23:14 +08:00
|
|
|
mlxsw_sp_fib_entry_hw_flags_clear(mlxsw_sp, replaced);
|
2019-12-27 00:41:17 +08:00
|
|
|
fib4_replaced = container_of(replaced, struct mlxsw_sp_fib4_entry,
|
|
|
|
common);
|
|
|
|
mlxsw_sp_fib4_entry_destroy(mlxsw_sp, fib4_replaced);
|
2017-02-09 17:28:44 +08:00
|
|
|
|
2016-07-04 14:23:11 +08:00
|
|
|
return 0;
|
|
|
|
|
2019-12-27 00:41:16 +08:00
|
|
|
err_fib_node_entry_link:
|
2019-12-27 00:41:17 +08:00
|
|
|
fib_node->fib_entry = replaced;
|
2017-07-18 16:10:26 +08:00
|
|
|
mlxsw_sp_fib4_entry_destroy(mlxsw_sp, fib4_entry);
|
mlxsw: spectrum_router: Correctly handle identical routes
In the device, routes are indexed in a routing table based on the prefix
and its length. This is in contrast to the kernel's FIB where several
FIB aliases can exist with these parameters being identical. In such
cases, the routes will be sorted by table ID (LOCAL first, then MAIN),
TOS and finally priority (metric).
During lookup, these routes will be evaluated in order. In case the
packet's TOS field is non-zero and a FIB alias with a matching TOS is
found, then it's selected. Otherwise, the lookup defaults to the route
with TOS 0 (if it exists). However, if the requested scope is narrower
than the one found, then the lookup continues.
To best reflect the kernel's datapath we should take the above into
account. Given a prefix and its length, the reflected route will always
be the first one in the FIB alias list. However, if the route has a
non-zero TOS then its action will be converted to trap instead of
forward, since we currently don't support TOS-based routing. If this
turns out to be a real issue, we can add support for that using
policy-based switching.
The route's scope can be effectively ignored as any packet being routed
by the device would've been looked-up using the widest scope (UNIVERSE).
To achieve that we need to do two changes. Firstly, we need to create
another struct (FIB node) that will hold the list of FIB entries sharing
the same prefix and length. This struct will be hashed using these two
parameters.
Secondly, we need to change the route reflection to match the above
logic, so that the first FIB entry in the list will be programmed into
the device while the rest will remain in the driver's cache in case of
subsequent changes.
Signed-off-by: Ido Schimmel <idosch@mellanox.com>
Signed-off-by: Jiri Pirko <jiri@mellanox.com>
Signed-off-by: David S. Miller <davem@davemloft.net>
2017-02-09 17:28:42 +08:00
|
|
|
err_fib4_entry_create:
|
2017-07-18 16:10:21 +08:00
|
|
|
mlxsw_sp_fib_node_put(mlxsw_sp, fib_node);
|
2016-07-04 14:23:11 +08:00
|
|
|
return err;
|
|
|
|
}
|
|
|
|
|
2016-10-20 22:05:43 +08:00
|
|
|
static void mlxsw_sp_router_fib4_del(struct mlxsw_sp *mlxsw_sp,
|
|
|
|
struct fib_entry_notifier_info *fen_info)
|
2016-07-04 14:23:11 +08:00
|
|
|
{
|
2017-07-18 16:10:26 +08:00
|
|
|
struct mlxsw_sp_fib4_entry *fib4_entry;
|
mlxsw: spectrum_router: Correctly handle identical routes
In the device, routes are indexed in a routing table based on the prefix
and its length. This is in contrast to the kernel's FIB where several
FIB aliases can exist with these parameters being identical. In such
cases, the routes will be sorted by table ID (LOCAL first, then MAIN),
TOS and finally priority (metric).
During lookup, these routes will be evaluated in order. In case the
packet's TOS field is non-zero and a FIB alias with a matching TOS is
found, then it's selected. Otherwise, the lookup defaults to the route
with TOS 0 (if it exists). However, if the requested scope is narrower
than the one found, then the lookup continues.
To best reflect the kernel's datapath we should take the above into
account. Given a prefix and its length, the reflected route will always
be the first one in the FIB alias list. However, if the route has a
non-zero TOS then its action will be converted to trap instead of
forward, since we currently don't support TOS-based routing. If this
turns out to be a real issue, we can add support for that using
policy-based switching.
The route's scope can be effectively ignored as any packet being routed
by the device would've been looked-up using the widest scope (UNIVERSE).
To achieve that we need to do two changes. Firstly, we need to create
another struct (FIB node) that will hold the list of FIB entries sharing
the same prefix and length. This struct will be hashed using these two
parameters.
Secondly, we need to change the route reflection to match the above
logic, so that the first FIB entry in the list will be programmed into
the device while the rest will remain in the driver's cache in case of
subsequent changes.
Signed-off-by: Ido Schimmel <idosch@mellanox.com>
Signed-off-by: Jiri Pirko <jiri@mellanox.com>
Signed-off-by: David S. Miller <davem@davemloft.net>
2017-02-09 17:28:42 +08:00
|
|
|
struct mlxsw_sp_fib_node *fib_node;
|
2016-07-04 14:23:11 +08:00
|
|
|
|
2017-05-17 01:38:25 +08:00
|
|
|
if (mlxsw_sp->router->aborted)
|
2016-10-20 22:05:43 +08:00
|
|
|
return;
|
2016-09-26 18:52:31 +08:00
|
|
|
|
2017-07-18 16:10:26 +08:00
|
|
|
fib4_entry = mlxsw_sp_fib4_entry_lookup(mlxsw_sp, fen_info);
|
2020-02-08 01:26:24 +08:00
|
|
|
if (!fib4_entry)
|
2016-10-20 22:05:43 +08:00
|
|
|
return;
|
2017-07-18 16:10:26 +08:00
|
|
|
fib_node = fib4_entry->common.fib_node;
|
2016-09-01 16:37:40 +08:00
|
|
|
|
2019-12-27 00:41:16 +08:00
|
|
|
mlxsw_sp_fib_node_entry_unlink(mlxsw_sp, &fib4_entry->common);
|
2017-07-18 16:10:26 +08:00
|
|
|
mlxsw_sp_fib4_entry_destroy(mlxsw_sp, fib4_entry);
|
2017-07-18 16:10:21 +08:00
|
|
|
mlxsw_sp_fib_node_put(mlxsw_sp, fib_node);
|
2016-07-04 14:23:11 +08:00
|
|
|
}
|
2016-09-26 18:52:31 +08:00
|
|
|
|
2018-04-18 08:33:26 +08:00
|
|
|
static bool mlxsw_sp_fib6_rt_should_ignore(const struct fib6_info *rt)
|
2017-08-03 19:28:28 +08:00
|
|
|
{
|
|
|
|
/* Packets with link-local destination IP arriving to the router
|
|
|
|
* are trapped to the CPU, so no need to program specific routes
|
|
|
|
* for them.
|
|
|
|
*/
|
2018-04-19 06:38:59 +08:00
|
|
|
if (ipv6_addr_type(&rt->fib6_dst.addr) & IPV6_ADDR_LINKLOCAL)
|
2017-08-03 19:28:28 +08:00
|
|
|
return true;
|
|
|
|
|
|
|
|
/* Multicast routes aren't supported, so ignore them. Neighbour
|
|
|
|
* Discovery packets are specifically trapped.
|
|
|
|
*/
|
2018-04-19 06:38:59 +08:00
|
|
|
if (ipv6_addr_type(&rt->fib6_dst.addr) & IPV6_ADDR_MULTICAST)
|
2017-08-03 19:28:28 +08:00
|
|
|
return true;
|
|
|
|
|
|
|
|
/* Cloned routes are irrelevant in the forwarding path. */
|
2018-04-19 06:38:59 +08:00
|
|
|
if (rt->fib6_flags & RTF_CACHE)
|
2017-08-03 19:28:28 +08:00
|
|
|
return true;
|
|
|
|
|
|
|
|
return false;
|
|
|
|
}
|
|
|
|
|
2018-04-18 08:33:26 +08:00
|
|
|
static struct mlxsw_sp_rt6 *mlxsw_sp_rt6_create(struct fib6_info *rt)
|
2017-08-03 19:28:28 +08:00
|
|
|
{
|
|
|
|
struct mlxsw_sp_rt6 *mlxsw_sp_rt6;
|
|
|
|
|
|
|
|
mlxsw_sp_rt6 = kzalloc(sizeof(*mlxsw_sp_rt6), GFP_KERNEL);
|
|
|
|
if (!mlxsw_sp_rt6)
|
|
|
|
return ERR_PTR(-ENOMEM);
|
|
|
|
|
|
|
|
/* In case of route replace, replaced route is deleted with
|
|
|
|
* no notification. Take reference to prevent accessing freed
|
|
|
|
* memory.
|
|
|
|
*/
|
|
|
|
mlxsw_sp_rt6->rt = rt;
|
2018-04-18 08:33:26 +08:00
|
|
|
fib6_info_hold(rt);
|
2017-08-03 19:28:28 +08:00
|
|
|
|
|
|
|
return mlxsw_sp_rt6;
|
|
|
|
}
|
|
|
|
|
|
|
|
/* Release @rt through fib6_info_release() when IPv6 support is enabled;
 * compiles to an empty function otherwise.
 */
static void mlxsw_sp_rt6_release(struct fib6_info *rt)
{
#if IS_ENABLED(CONFIG_IPV6)
	fib6_info_release(rt);
#endif
}
|
|
|
|
|
|
|
|
static void mlxsw_sp_rt6_destroy(struct mlxsw_sp_rt6 *mlxsw_sp_rt6)
|
|
|
|
{
|
2020-02-08 01:26:26 +08:00
|
|
|
struct fib6_nh *fib6_nh = mlxsw_sp_rt6->rt->fib6_nh;
|
|
|
|
|
|
|
|
fib6_nh->fib_nh_flags &= ~RTNH_F_OFFLOAD;
|
2017-08-03 19:28:28 +08:00
|
|
|
mlxsw_sp_rt6_release(mlxsw_sp_rt6->rt);
|
|
|
|
kfree(mlxsw_sp_rt6);
|
|
|
|
}
|
|
|
|
|
2018-04-18 08:33:26 +08:00
|
|
|
static struct fib6_info *
|
2017-08-03 19:28:28 +08:00
|
|
|
mlxsw_sp_fib6_entry_rt(const struct mlxsw_sp_fib6_entry *fib6_entry)
|
|
|
|
{
|
|
|
|
return list_first_entry(&fib6_entry->rt6_list, struct mlxsw_sp_rt6,
|
|
|
|
list)->rt;
|
|
|
|
}
|
|
|
|
|
|
|
|
static struct mlxsw_sp_rt6 *
|
|
|
|
mlxsw_sp_fib6_entry_rt_find(const struct mlxsw_sp_fib6_entry *fib6_entry,
|
2018-04-18 08:33:26 +08:00
|
|
|
const struct fib6_info *rt)
|
2017-08-03 19:28:28 +08:00
|
|
|
{
|
|
|
|
struct mlxsw_sp_rt6 *mlxsw_sp_rt6;
|
|
|
|
|
|
|
|
list_for_each_entry(mlxsw_sp_rt6, &fib6_entry->rt6_list, list) {
|
|
|
|
if (mlxsw_sp_rt6->rt == rt)
|
|
|
|
return mlxsw_sp_rt6;
|
|
|
|
}
|
|
|
|
|
|
|
|
return NULL;
|
|
|
|
}
|
|
|
|
|
2017-09-03 05:49:24 +08:00
|
|
|
static bool mlxsw_sp_nexthop6_ipip_type(const struct mlxsw_sp *mlxsw_sp,
|
2018-04-18 08:33:26 +08:00
|
|
|
const struct fib6_info *rt,
|
2017-09-03 05:49:24 +08:00
|
|
|
enum mlxsw_sp_ipip_type *ret)
|
|
|
|
{
|
2019-05-23 11:27:59 +08:00
|
|
|
return rt->fib6_nh->fib_nh_dev &&
|
|
|
|
mlxsw_sp_netdev_ipip_type(mlxsw_sp, rt->fib6_nh->fib_nh_dev, ret);
|
2017-09-03 05:49:24 +08:00
|
|
|
}
|
|
|
|
|
mlxsw: spectrum_router: Make nexthops typed
In the router, some next hops may reference an encapsulating netdevice,
such as GRE or IPIP. To properly offload these next hops, mlxsw needs to
keep track of whether a given next hop is a regular Ethernet entry, or
an IP-in-IP tunneling entry.
To facilitate this book-keeping, add a type field to struct
mlxsw_sp_nexthop. There is, as of this patch, only one next hop type:
MLXSW_SP_NEXTHOP_TYPE_ETH. Follow-up patches will introduce the IP-in-IP
variant.
There are several places where next hops are initialized in the IPv4
path. Instead of replicating the logic at every one of them, factor it
out to a function mlxsw_sp_nexthop4_type_init(). The corresponding fini
is actually protocol-neutral, so put it to mlxsw_sp_nexthop_type_fini(),
but create a corresponding protocoled _fini function that dispatches to
the protocol-neutral one.
The IPv6 path is simpler, but for symmetry with IPv4, create the same
suite of functions with corresponding logic.
Signed-off-by: Petr Machata <petrm@mellanox.com>
Reviewed-by: Ido Schimmel <idosch@mellanox.com>
Signed-off-by: Jiri Pirko <jiri@mellanox.com>
Signed-off-by: David S. Miller <davem@davemloft.net>
2017-09-03 05:49:22 +08:00
|
|
|
static int mlxsw_sp_nexthop6_type_init(struct mlxsw_sp *mlxsw_sp,
|
|
|
|
struct mlxsw_sp_nexthop_group *nh_grp,
|
|
|
|
struct mlxsw_sp_nexthop *nh,
|
2018-04-18 08:33:26 +08:00
|
|
|
const struct fib6_info *rt)
|
2017-08-03 19:28:28 +08:00
|
|
|
{
|
2017-11-28 20:17:13 +08:00
|
|
|
const struct mlxsw_sp_ipip_ops *ipip_ops;
|
|
|
|
struct mlxsw_sp_ipip_entry *ipip_entry;
|
2019-05-23 11:27:59 +08:00
|
|
|
struct net_device *dev = rt->fib6_nh->fib_nh_dev;
|
2017-08-03 19:28:28 +08:00
|
|
|
struct mlxsw_sp_rif *rif;
|
|
|
|
int err;
|
|
|
|
|
2017-11-28 20:17:13 +08:00
|
|
|
ipip_entry = mlxsw_sp_ipip_entry_find_by_ol_dev(mlxsw_sp, dev);
|
|
|
|
if (ipip_entry) {
|
|
|
|
ipip_ops = mlxsw_sp->router->ipip_ops_arr[ipip_entry->ipipt];
|
|
|
|
if (ipip_ops->can_offload(mlxsw_sp, dev,
|
|
|
|
MLXSW_SP_L3_PROTO_IPV6)) {
|
|
|
|
nh->type = MLXSW_SP_NEXTHOP_TYPE_IPIP;
|
|
|
|
mlxsw_sp_nexthop_ipip_init(mlxsw_sp, nh, ipip_entry);
|
|
|
|
return 0;
|
|
|
|
}
|
2017-09-03 05:49:24 +08:00
|
|
|
}
|
|
|
|
|
mlxsw: spectrum_router: Make nexthops typed
In the router, some next hops may reference an encapsulating netdevice,
such as GRE or IPIP. To properly offload these next hops, mlxsw needs to
keep track of whether a given next hop is a regular Ethernet entry, or
an IP-in-IP tunneling entry.
To facilitate this book-keeping, add a type field to struct
mlxsw_sp_nexthop. There is, as of this patch, only one next hop type:
MLXSW_SP_NEXTHOP_TYPE_ETH. Follow-up patches will introduce the IP-in-IP
variant.
There are several places where next hops are initialized in the IPv4
path. Instead of replicating the logic at every one of them, factor it
out to a function mlxsw_sp_nexthop4_type_init(). The corresponding fini
is actually protocol-neutral, so put it to mlxsw_sp_nexthop_type_fini(),
but create a corresponding protocoled _fini function that dispatches to
the protocol-neutral one.
The IPv6 path is simpler, but for symmetry with IPv4, create the same
suite of functions with corresponding logic.
Signed-off-by: Petr Machata <petrm@mellanox.com>
Reviewed-by: Ido Schimmel <idosch@mellanox.com>
Signed-off-by: Jiri Pirko <jiri@mellanox.com>
Signed-off-by: David S. Miller <davem@davemloft.net>
2017-09-03 05:49:22 +08:00
|
|
|
nh->type = MLXSW_SP_NEXTHOP_TYPE_ETH;
|
2017-08-03 19:28:28 +08:00
|
|
|
rif = mlxsw_sp_rif_find_by_dev(mlxsw_sp, dev);
|
|
|
|
if (!rif)
|
|
|
|
return 0;
|
|
|
|
mlxsw_sp_nexthop_rif_init(nh, rif);
|
|
|
|
|
|
|
|
err = mlxsw_sp_nexthop_neigh_init(mlxsw_sp, nh);
|
|
|
|
if (err)
|
|
|
|
goto err_nexthop_neigh_init;
|
|
|
|
|
|
|
|
return 0;
|
|
|
|
|
|
|
|
err_nexthop_neigh_init:
|
|
|
|
mlxsw_sp_nexthop_rif_fini(nh);
|
|
|
|
return err;
|
|
|
|
}
|
|
|
|
|
mlxsw: spectrum_router: Make nexthops typed
In the router, some next hops may reference an encapsulating netdevice,
such as GRE or IPIP. To properly offload these next hops, mlxsw needs to
keep track of whether a given next hop is a regular Ethernet entry, or
an IP-in-IP tunneling entry.
To facilitate this book-keeping, add a type field to struct
mlxsw_sp_nexthop. There is, as of this patch, only one next hop type:
MLXSW_SP_NEXTHOP_TYPE_ETH. Follow-up patches will introduce the IP-in-IP
variant.
There are several places where next hops are initialized in the IPv4
path. Instead of replicating the logic at every one of them, factor it
out to a function mlxsw_sp_nexthop4_type_init(). The corresponding fini
is actually protocol-neutral, so put it to mlxsw_sp_nexthop_type_fini(),
but create a corresponding protocoled _fini function that dispatches to
the protocol-neutral one.
The IPv6 path is simpler, but for symmetry with IPv4, create the same
suite of functions with corresponding logic.
Signed-off-by: Petr Machata <petrm@mellanox.com>
Reviewed-by: Ido Schimmel <idosch@mellanox.com>
Signed-off-by: Jiri Pirko <jiri@mellanox.com>
Signed-off-by: David S. Miller <davem@davemloft.net>
2017-09-03 05:49:22 +08:00
|
|
|
/* IPv6 counterpart of the type teardown; it simply forwards to the
 * protocol-neutral mlxsw_sp_nexthop_type_fini().
 */
static void mlxsw_sp_nexthop6_type_fini(struct mlxsw_sp *mlxsw_sp,
					struct mlxsw_sp_nexthop *nh)
{
	mlxsw_sp_nexthop_type_fini(mlxsw_sp, nh);
}
|
|
|
|
|
|
|
|
static int mlxsw_sp_nexthop6_init(struct mlxsw_sp *mlxsw_sp,
|
|
|
|
struct mlxsw_sp_nexthop_group *nh_grp,
|
|
|
|
struct mlxsw_sp_nexthop *nh,
|
2018-04-18 08:33:26 +08:00
|
|
|
const struct fib6_info *rt)
|
mlxsw: spectrum_router: Make nexthops typed
In the router, some next hops may reference an encapsulating netdevice,
such as GRE or IPIP. To properly offload these next hops, mlxsw needs to
keep track of whether a given next hop is a regular Ethernet entry, or
an IP-in-IP tunneling entry.
To facilitate this book-keeping, add a type field to struct
mlxsw_sp_nexthop. There is, as of this patch, only one next hop type:
MLXSW_SP_NEXTHOP_TYPE_ETH. Follow-up patches will introduce the IP-in-IP
variant.
There are several places where next hops are initialized in the IPv4
path. Instead of replicating the logic at every one of them, factor it
out to a function mlxsw_sp_nexthop4_type_init(). The corresponding fini
is actually protocol-neutral, so put it to mlxsw_sp_nexthop_type_fini(),
but create a corresponding protocoled _fini function that dispatches to
the protocol-neutral one.
The IPv6 path is simpler, but for symmetry with IPv4, create the same
suite of functions with corresponding logic.
Signed-off-by: Petr Machata <petrm@mellanox.com>
Reviewed-by: Ido Schimmel <idosch@mellanox.com>
Signed-off-by: Jiri Pirko <jiri@mellanox.com>
Signed-off-by: David S. Miller <davem@davemloft.net>
2017-09-03 05:49:22 +08:00
|
|
|
{
|
2019-05-23 11:27:59 +08:00
|
|
|
struct net_device *dev = rt->fib6_nh->fib_nh_dev;
|
mlxsw: spectrum_router: Make nexthops typed
In the router, some next hops may reference an encapsulating netdevice,
such as GRE or IPIP. To properly offload these next hops, mlxsw needs to
keep track of whether a given next hop is a regular Ethernet entry, or
an IP-in-IP tunneling entry.
To facilitate this book-keeping, add a type field to struct
mlxsw_sp_nexthop. There is, as of this patch, only one next hop type:
MLXSW_SP_NEXTHOP_TYPE_ETH. Follow-up patches will introduce the IP-in-IP
variant.
There are several places where next hops are initialized in the IPv4
path. Instead of replicating the logic at every one of them, factor it
out to a function mlxsw_sp_nexthop4_type_init(). The corresponding fini
is actually protocol-neutral, so put it to mlxsw_sp_nexthop_type_fini(),
but create a corresponding protocoled _fini function that dispatches to
the protocol-neutral one.
The IPv6 path is simpler, but for symmetry with IPv4, create the same
suite of functions with corresponding logic.
Signed-off-by: Petr Machata <petrm@mellanox.com>
Reviewed-by: Ido Schimmel <idosch@mellanox.com>
Signed-off-by: Jiri Pirko <jiri@mellanox.com>
Signed-off-by: David S. Miller <davem@davemloft.net>
2017-09-03 05:49:22 +08:00
|
|
|
|
|
|
|
nh->nh_grp = nh_grp;
|
2019-05-23 11:27:59 +08:00
|
|
|
nh->nh_weight = rt->fib6_nh->fib_nh_weight;
|
|
|
|
memcpy(&nh->gw_addr, &rt->fib6_nh->fib_nh_gw6, sizeof(nh->gw_addr));
|
2017-09-25 16:32:28 +08:00
|
|
|
mlxsw_sp_nexthop_counter_alloc(mlxsw_sp, nh);
|
mlxsw: spectrum_router: Make nexthops typed
In the router, some next hops may reference an encapsulating netdevice,
such as GRE or IPIP. To properly offload these next hops, mlxsw needs to
keep track of whether a given next hop is a regular Ethernet entry, or
an IP-in-IP tunneling entry.
To facilitate this book-keeping, add a type field to struct
mlxsw_sp_nexthop. There is, as of this patch, only one next hop type:
MLXSW_SP_NEXTHOP_TYPE_ETH. Follow-up patches will introduce the IP-in-IP
variant.
There are several places where next hops are initialized in the IPv4
path. Instead of replicating the logic at every one of them, factor it
out to a function mlxsw_sp_nexthop4_type_init(). The corresponding fini
is actually protocol-neutral, so put it to mlxsw_sp_nexthop_type_fini(),
but create a corresponding protocoled _fini function that dispatches to
the protocol-neutral one.
The IPv6 path is simpler, but for symmetry with IPv4, create the same
suite of functions with corresponding logic.
Signed-off-by: Petr Machata <petrm@mellanox.com>
Reviewed-by: Ido Schimmel <idosch@mellanox.com>
Signed-off-by: Jiri Pirko <jiri@mellanox.com>
Signed-off-by: David S. Miller <davem@davemloft.net>
2017-09-03 05:49:22 +08:00
|
|
|
|
2017-09-25 16:32:23 +08:00
|
|
|
list_add_tail(&nh->router_list_node, &mlxsw_sp->router->nexthop_list);
|
|
|
|
|
mlxsw: spectrum_router: Make nexthops typed
In the router, some next hops may reference an encapsulating netdevice,
such as GRE or IPIP. To properly offload these next hops, mlxsw needs to
keep track of whether a given next hop is a regular Ethernet entry, or
an IP-in-IP tunneling entry.
To facilitate this book-keeping, add a type field to struct
mlxsw_sp_nexthop. There is, as of this patch, only one next hop type:
MLXSW_SP_NEXTHOP_TYPE_ETH. Follow-up patches will introduce the IP-in-IP
variant.
There are several places where next hops are initialized in the IPv4
path. Instead of replicating the logic at every one of them, factor it
out to a function mlxsw_sp_nexthop4_type_init(). The corresponding fini
is actually protocol-neutral, so put it to mlxsw_sp_nexthop_type_fini(),
but create a corresponding protocoled _fini function that dispatches to
the protocol-neutral one.
The IPv6 path is simpler, but for symmetry with IPv4, create the same
suite of functions with corresponding logic.
Signed-off-by: Petr Machata <petrm@mellanox.com>
Reviewed-by: Ido Schimmel <idosch@mellanox.com>
Signed-off-by: Jiri Pirko <jiri@mellanox.com>
Signed-off-by: David S. Miller <davem@davemloft.net>
2017-09-03 05:49:22 +08:00
|
|
|
if (!dev)
|
|
|
|
return 0;
|
|
|
|
nh->ifindex = dev->ifindex;
|
|
|
|
|
|
|
|
return mlxsw_sp_nexthop6_type_init(mlxsw_sp, nh_grp, nh, rt);
|
|
|
|
}
|
|
|
|
|
2017-08-03 19:28:28 +08:00
|
|
|
static void mlxsw_sp_nexthop6_fini(struct mlxsw_sp *mlxsw_sp,
|
|
|
|
struct mlxsw_sp_nexthop *nh)
|
|
|
|
{
|
mlxsw: spectrum_router: Make nexthops typed
In the router, some next hops may reference an encapsulating netdevice,
such as GRE or IPIP. To properly offload these next hops, mlxsw needs to
keep track of whether a given next hop is a regular Ethernet entry, or
an IP-in-IP tunneling entry.
To facilitate this book-keeping, add a type field to struct
mlxsw_sp_nexthop. There is, as of this patch, only one next hop type:
MLXSW_SP_NEXTHOP_TYPE_ETH. Follow-up patches will introduce the IP-in-IP
variant.
There are several places where next hops are initialized in the IPv4
path. Instead of replicating the logic at every one of them, factor it
out to a function mlxsw_sp_nexthop4_type_init(). The corresponding fini
is actually protocol-neutral, so put it to mlxsw_sp_nexthop_type_fini(),
but create a corresponding protocoled _fini function that dispatches to
the protocol-neutral one.
The IPv6 path is simpler, but for symmetry with IPv4, create the same
suite of functions with corresponding logic.
Signed-off-by: Petr Machata <petrm@mellanox.com>
Reviewed-by: Ido Schimmel <idosch@mellanox.com>
Signed-off-by: Jiri Pirko <jiri@mellanox.com>
Signed-off-by: David S. Miller <davem@davemloft.net>
2017-09-03 05:49:22 +08:00
|
|
|
mlxsw_sp_nexthop6_type_fini(mlxsw_sp, nh);
|
2017-09-25 16:32:23 +08:00
|
|
|
list_del(&nh->router_list_node);
|
2017-09-25 16:32:28 +08:00
|
|
|
mlxsw_sp_nexthop_counter_free(mlxsw_sp, nh);
|
2017-08-03 19:28:28 +08:00
|
|
|
}
|
|
|
|
|
2017-09-03 05:49:21 +08:00
|
|
|
static bool mlxsw_sp_rt6_is_gateway(const struct mlxsw_sp *mlxsw_sp,
|
2018-04-18 08:33:26 +08:00
|
|
|
const struct fib6_info *rt)
|
2017-09-03 05:49:21 +08:00
|
|
|
{
|
2019-05-23 11:27:59 +08:00
|
|
|
return rt->fib6_nh->fib_nh_gw_family ||
|
2017-09-03 05:49:24 +08:00
|
|
|
mlxsw_sp_nexthop6_ipip_type(mlxsw_sp, rt, NULL);
|
2017-09-03 05:49:21 +08:00
|
|
|
}
|
|
|
|
|
2017-08-03 19:28:28 +08:00
|
|
|
static struct mlxsw_sp_nexthop_group *
|
|
|
|
mlxsw_sp_nexthop6_group_create(struct mlxsw_sp *mlxsw_sp,
|
|
|
|
struct mlxsw_sp_fib6_entry *fib6_entry)
|
|
|
|
{
|
|
|
|
struct mlxsw_sp_nexthop_group *nh_grp;
|
|
|
|
struct mlxsw_sp_rt6 *mlxsw_sp_rt6;
|
|
|
|
struct mlxsw_sp_nexthop *nh;
|
|
|
|
int i = 0;
|
|
|
|
int err;
|
|
|
|
|
2019-02-08 11:42:41 +08:00
|
|
|
nh_grp = kzalloc(struct_size(nh_grp, nexthops, fib6_entry->nrt6),
|
|
|
|
GFP_KERNEL);
|
2017-08-03 19:28:28 +08:00
|
|
|
if (!nh_grp)
|
|
|
|
return ERR_PTR(-ENOMEM);
|
|
|
|
INIT_LIST_HEAD(&nh_grp->fib_list);
|
|
|
|
#if IS_ENABLED(CONFIG_IPV6)
|
|
|
|
nh_grp->neigh_tbl = &nd_tbl;
|
|
|
|
#endif
|
|
|
|
mlxsw_sp_rt6 = list_first_entry(&fib6_entry->rt6_list,
|
|
|
|
struct mlxsw_sp_rt6, list);
|
2017-09-03 05:49:21 +08:00
|
|
|
nh_grp->gateway = mlxsw_sp_rt6_is_gateway(mlxsw_sp, mlxsw_sp_rt6->rt);
|
2017-08-03 19:28:28 +08:00
|
|
|
nh_grp->count = fib6_entry->nrt6;
|
|
|
|
for (i = 0; i < nh_grp->count; i++) {
|
2018-04-18 08:33:26 +08:00
|
|
|
struct fib6_info *rt = mlxsw_sp_rt6->rt;
|
2017-08-03 19:28:28 +08:00
|
|
|
|
|
|
|
nh = &nh_grp->nexthops[i];
|
|
|
|
err = mlxsw_sp_nexthop6_init(mlxsw_sp, nh_grp, nh, rt);
|
|
|
|
if (err)
|
|
|
|
goto err_nexthop6_init;
|
|
|
|
mlxsw_sp_rt6 = list_next_entry(mlxsw_sp_rt6, list);
|
|
|
|
}
|
2017-08-15 03:09:20 +08:00
|
|
|
|
|
|
|
err = mlxsw_sp_nexthop_group_insert(mlxsw_sp, nh_grp);
|
|
|
|
if (err)
|
|
|
|
goto err_nexthop_group_insert;
|
|
|
|
|
2017-08-03 19:28:28 +08:00
|
|
|
mlxsw_sp_nexthop_group_refresh(mlxsw_sp, nh_grp);
|
|
|
|
return nh_grp;
|
|
|
|
|
2017-08-15 03:09:20 +08:00
|
|
|
err_nexthop_group_insert:
|
2017-08-03 19:28:28 +08:00
|
|
|
err_nexthop6_init:
|
|
|
|
for (i--; i >= 0; i--) {
|
|
|
|
nh = &nh_grp->nexthops[i];
|
|
|
|
mlxsw_sp_nexthop6_fini(mlxsw_sp, nh);
|
|
|
|
}
|
|
|
|
kfree(nh_grp);
|
|
|
|
return ERR_PTR(err);
|
|
|
|
}
|
|
|
|
|
|
|
|
static void
|
|
|
|
mlxsw_sp_nexthop6_group_destroy(struct mlxsw_sp *mlxsw_sp,
|
|
|
|
struct mlxsw_sp_nexthop_group *nh_grp)
|
|
|
|
{
|
|
|
|
struct mlxsw_sp_nexthop *nh;
|
|
|
|
int i = nh_grp->count;
|
|
|
|
|
2017-08-15 03:09:20 +08:00
|
|
|
mlxsw_sp_nexthop_group_remove(mlxsw_sp, nh_grp);
|
2017-08-03 19:28:28 +08:00
|
|
|
for (i--; i >= 0; i--) {
|
|
|
|
nh = &nh_grp->nexthops[i];
|
|
|
|
mlxsw_sp_nexthop6_fini(mlxsw_sp, nh);
|
|
|
|
}
|
|
|
|
mlxsw_sp_nexthop_group_refresh(mlxsw_sp, nh_grp);
|
|
|
|
WARN_ON(nh_grp->adj_index_valid);
|
|
|
|
kfree(nh_grp);
|
|
|
|
}
|
|
|
|
|
|
|
|
static int mlxsw_sp_nexthop6_group_get(struct mlxsw_sp *mlxsw_sp,
|
|
|
|
struct mlxsw_sp_fib6_entry *fib6_entry)
|
|
|
|
{
|
|
|
|
struct mlxsw_sp_nexthop_group *nh_grp;
|
|
|
|
|
2017-08-15 03:09:20 +08:00
|
|
|
nh_grp = mlxsw_sp_nexthop6_group_lookup(mlxsw_sp, fib6_entry);
|
|
|
|
if (!nh_grp) {
|
|
|
|
nh_grp = mlxsw_sp_nexthop6_group_create(mlxsw_sp, fib6_entry);
|
|
|
|
if (IS_ERR(nh_grp))
|
|
|
|
return PTR_ERR(nh_grp);
|
|
|
|
}
|
2017-08-03 19:28:28 +08:00
|
|
|
|
|
|
|
list_add_tail(&fib6_entry->common.nexthop_group_node,
|
|
|
|
&nh_grp->fib_list);
|
|
|
|
fib6_entry->common.nh_group = nh_grp;
|
|
|
|
|
2020-01-14 19:23:13 +08:00
|
|
|
/* The route and the nexthop are described by the same struct, so we
|
|
|
|
* need to the update the nexthop offload indication for the new route.
|
|
|
|
*/
|
|
|
|
__mlxsw_sp_nexthop6_group_offload_refresh(nh_grp, fib6_entry);
|
|
|
|
|
2017-08-03 19:28:28 +08:00
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
|
|
|
static void mlxsw_sp_nexthop6_group_put(struct mlxsw_sp *mlxsw_sp,
|
|
|
|
struct mlxsw_sp_fib_entry *fib_entry)
|
|
|
|
{
|
|
|
|
struct mlxsw_sp_nexthop_group *nh_grp = fib_entry->nh_group;
|
|
|
|
|
|
|
|
list_del(&fib_entry->nexthop_group_node);
|
|
|
|
if (!list_empty(&nh_grp->fib_list))
|
|
|
|
return;
|
|
|
|
mlxsw_sp_nexthop6_group_destroy(mlxsw_sp, nh_grp);
|
|
|
|
}
|
|
|
|
|
|
|
|
static int
|
|
|
|
mlxsw_sp_nexthop6_group_update(struct mlxsw_sp *mlxsw_sp,
|
|
|
|
struct mlxsw_sp_fib6_entry *fib6_entry)
|
|
|
|
{
|
|
|
|
struct mlxsw_sp_nexthop_group *old_nh_grp = fib6_entry->common.nh_group;
|
|
|
|
int err;
|
|
|
|
|
|
|
|
fib6_entry->common.nh_group = NULL;
|
|
|
|
list_del(&fib6_entry->common.nexthop_group_node);
|
|
|
|
|
|
|
|
err = mlxsw_sp_nexthop6_group_get(mlxsw_sp, fib6_entry);
|
|
|
|
if (err)
|
|
|
|
goto err_nexthop6_group_get;
|
|
|
|
|
|
|
|
/* In case this entry is offloaded, then the adjacency index
|
|
|
|
* currently associated with it in the device's table is that
|
|
|
|
* of the old group. Start using the new one instead.
|
|
|
|
*/
|
2019-12-27 00:41:17 +08:00
|
|
|
err = mlxsw_sp_fib_entry_update(mlxsw_sp, &fib6_entry->common);
|
2017-08-03 19:28:28 +08:00
|
|
|
if (err)
|
2019-12-27 00:41:17 +08:00
|
|
|
goto err_fib_entry_update;
|
2017-08-03 19:28:28 +08:00
|
|
|
|
|
|
|
if (list_empty(&old_nh_grp->fib_list))
|
|
|
|
mlxsw_sp_nexthop6_group_destroy(mlxsw_sp, old_nh_grp);
|
|
|
|
|
|
|
|
return 0;
|
|
|
|
|
2019-12-27 00:41:17 +08:00
|
|
|
err_fib_entry_update:
|
2017-08-03 19:28:28 +08:00
|
|
|
mlxsw_sp_nexthop6_group_put(mlxsw_sp, &fib6_entry->common);
|
|
|
|
err_nexthop6_group_get:
|
|
|
|
list_add_tail(&fib6_entry->common.nexthop_group_node,
|
|
|
|
&old_nh_grp->fib_list);
|
|
|
|
fib6_entry->common.nh_group = old_nh_grp;
|
|
|
|
return err;
|
|
|
|
}
|
|
|
|
|
|
|
|
static int
|
|
|
|
mlxsw_sp_fib6_entry_nexthop_add(struct mlxsw_sp *mlxsw_sp,
|
|
|
|
struct mlxsw_sp_fib6_entry *fib6_entry,
|
2019-06-18 23:12:55 +08:00
|
|
|
struct fib6_info **rt_arr, unsigned int nrt6)
|
2017-08-03 19:28:28 +08:00
|
|
|
{
|
|
|
|
struct mlxsw_sp_rt6 *mlxsw_sp_rt6;
|
2019-06-18 23:12:55 +08:00
|
|
|
int err, i;
|
2017-08-03 19:28:28 +08:00
|
|
|
|
2019-06-18 23:12:55 +08:00
|
|
|
for (i = 0; i < nrt6; i++) {
|
|
|
|
mlxsw_sp_rt6 = mlxsw_sp_rt6_create(rt_arr[i]);
|
|
|
|
if (IS_ERR(mlxsw_sp_rt6)) {
|
|
|
|
err = PTR_ERR(mlxsw_sp_rt6);
|
|
|
|
goto err_rt6_create;
|
|
|
|
}
|
2017-08-03 19:28:28 +08:00
|
|
|
|
2019-06-18 23:12:55 +08:00
|
|
|
list_add_tail(&mlxsw_sp_rt6->list, &fib6_entry->rt6_list);
|
|
|
|
fib6_entry->nrt6++;
|
|
|
|
}
|
2017-08-03 19:28:28 +08:00
|
|
|
|
|
|
|
err = mlxsw_sp_nexthop6_group_update(mlxsw_sp, fib6_entry);
|
|
|
|
if (err)
|
|
|
|
goto err_nexthop6_group_update;
|
|
|
|
|
|
|
|
return 0;
|
|
|
|
|
|
|
|
err_nexthop6_group_update:
|
2019-06-18 23:12:55 +08:00
|
|
|
i = nrt6;
|
|
|
|
err_rt6_create:
|
|
|
|
for (i--; i >= 0; i--) {
|
|
|
|
fib6_entry->nrt6--;
|
|
|
|
mlxsw_sp_rt6 = list_last_entry(&fib6_entry->rt6_list,
|
|
|
|
struct mlxsw_sp_rt6, list);
|
|
|
|
list_del(&mlxsw_sp_rt6->list);
|
|
|
|
mlxsw_sp_rt6_destroy(mlxsw_sp_rt6);
|
|
|
|
}
|
2017-08-03 19:28:28 +08:00
|
|
|
return err;
|
|
|
|
}
|
|
|
|
|
|
|
|
static void
|
|
|
|
mlxsw_sp_fib6_entry_nexthop_del(struct mlxsw_sp *mlxsw_sp,
|
|
|
|
struct mlxsw_sp_fib6_entry *fib6_entry,
|
2019-06-18 23:12:55 +08:00
|
|
|
struct fib6_info **rt_arr, unsigned int nrt6)
|
2017-08-03 19:28:28 +08:00
|
|
|
{
|
|
|
|
struct mlxsw_sp_rt6 *mlxsw_sp_rt6;
|
2019-06-18 23:12:55 +08:00
|
|
|
int i;
|
2017-08-03 19:28:28 +08:00
|
|
|
|
2019-06-18 23:12:55 +08:00
|
|
|
for (i = 0; i < nrt6; i++) {
|
|
|
|
mlxsw_sp_rt6 = mlxsw_sp_fib6_entry_rt_find(fib6_entry,
|
|
|
|
rt_arr[i]);
|
|
|
|
if (WARN_ON_ONCE(!mlxsw_sp_rt6))
|
|
|
|
continue;
|
|
|
|
|
|
|
|
fib6_entry->nrt6--;
|
|
|
|
list_del(&mlxsw_sp_rt6->list);
|
|
|
|
mlxsw_sp_rt6_destroy(mlxsw_sp_rt6);
|
|
|
|
}
|
2017-08-03 19:28:28 +08:00
|
|
|
|
|
|
|
mlxsw_sp_nexthop6_group_update(mlxsw_sp, fib6_entry);
|
|
|
|
}
|
|
|
|
|
2017-09-03 05:49:21 +08:00
|
|
|
static void mlxsw_sp_fib6_entry_type_set(struct mlxsw_sp *mlxsw_sp,
|
|
|
|
struct mlxsw_sp_fib_entry *fib_entry,
|
2018-04-18 08:33:26 +08:00
|
|
|
const struct fib6_info *rt)
|
2017-08-03 19:28:28 +08:00
|
|
|
{
|
|
|
|
/* Packets hitting RTF_REJECT routes need to be discarded by the
|
|
|
|
* stack. We can rely on their destination device not having a
|
|
|
|
* RIF (it's the loopback device) and can thus use action type
|
|
|
|
* local, which will cause them to be trapped with a lower
|
|
|
|
* priority than packets that need to be locally received.
|
|
|
|
*/
|
2018-04-19 06:38:59 +08:00
|
|
|
if (rt->fib6_flags & (RTF_LOCAL | RTF_ANYCAST))
|
2017-08-03 19:28:28 +08:00
|
|
|
fib_entry->type = MLXSW_SP_FIB_ENTRY_TYPE_TRAP;
|
2019-02-07 03:42:01 +08:00
|
|
|
else if (rt->fib6_type == RTN_BLACKHOLE)
|
|
|
|
fib_entry->type = MLXSW_SP_FIB_ENTRY_TYPE_BLACKHOLE;
|
2018-04-19 06:38:59 +08:00
|
|
|
else if (rt->fib6_flags & RTF_REJECT)
|
2019-11-08 00:42:15 +08:00
|
|
|
fib_entry->type = MLXSW_SP_FIB_ENTRY_TYPE_UNREACHABLE;
|
2017-09-03 05:49:21 +08:00
|
|
|
else if (mlxsw_sp_rt6_is_gateway(mlxsw_sp, rt))
|
2017-08-03 19:28:28 +08:00
|
|
|
fib_entry->type = MLXSW_SP_FIB_ENTRY_TYPE_REMOTE;
|
|
|
|
else
|
|
|
|
fib_entry->type = MLXSW_SP_FIB_ENTRY_TYPE_LOCAL;
|
|
|
|
}
|
|
|
|
|
|
|
|
static void
|
|
|
|
mlxsw_sp_fib6_entry_rt_destroy_all(struct mlxsw_sp_fib6_entry *fib6_entry)
|
|
|
|
{
|
|
|
|
struct mlxsw_sp_rt6 *mlxsw_sp_rt6, *tmp;
|
|
|
|
|
|
|
|
list_for_each_entry_safe(mlxsw_sp_rt6, tmp, &fib6_entry->rt6_list,
|
|
|
|
list) {
|
|
|
|
fib6_entry->nrt6--;
|
|
|
|
list_del(&mlxsw_sp_rt6->list);
|
|
|
|
mlxsw_sp_rt6_destroy(mlxsw_sp_rt6);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
static struct mlxsw_sp_fib6_entry *
|
|
|
|
mlxsw_sp_fib6_entry_create(struct mlxsw_sp *mlxsw_sp,
|
|
|
|
struct mlxsw_sp_fib_node *fib_node,
|
2019-06-18 23:12:56 +08:00
|
|
|
struct fib6_info **rt_arr, unsigned int nrt6)
|
2017-08-03 19:28:28 +08:00
|
|
|
{
|
|
|
|
struct mlxsw_sp_fib6_entry *fib6_entry;
|
|
|
|
struct mlxsw_sp_fib_entry *fib_entry;
|
|
|
|
struct mlxsw_sp_rt6 *mlxsw_sp_rt6;
|
2019-06-18 23:12:56 +08:00
|
|
|
int err, i;
|
2017-08-03 19:28:28 +08:00
|
|
|
|
|
|
|
fib6_entry = kzalloc(sizeof(*fib6_entry), GFP_KERNEL);
|
|
|
|
if (!fib6_entry)
|
|
|
|
return ERR_PTR(-ENOMEM);
|
|
|
|
fib_entry = &fib6_entry->common;
|
|
|
|
|
2019-06-18 23:12:56 +08:00
|
|
|
INIT_LIST_HEAD(&fib6_entry->rt6_list);
|
|
|
|
|
|
|
|
for (i = 0; i < nrt6; i++) {
|
|
|
|
mlxsw_sp_rt6 = mlxsw_sp_rt6_create(rt_arr[i]);
|
|
|
|
if (IS_ERR(mlxsw_sp_rt6)) {
|
|
|
|
err = PTR_ERR(mlxsw_sp_rt6);
|
|
|
|
goto err_rt6_create;
|
|
|
|
}
|
|
|
|
list_add_tail(&mlxsw_sp_rt6->list, &fib6_entry->rt6_list);
|
|
|
|
fib6_entry->nrt6++;
|
2017-08-03 19:28:28 +08:00
|
|
|
}
|
|
|
|
|
2019-06-18 23:12:56 +08:00
|
|
|
mlxsw_sp_fib6_entry_type_set(mlxsw_sp, fib_entry, rt_arr[0]);
|
2017-08-03 19:28:28 +08:00
|
|
|
|
|
|
|
err = mlxsw_sp_nexthop6_group_get(mlxsw_sp, fib6_entry);
|
|
|
|
if (err)
|
|
|
|
goto err_nexthop6_group_get;
|
|
|
|
|
|
|
|
fib_entry->fib_node = fib_node;
|
|
|
|
|
|
|
|
return fib6_entry;
|
|
|
|
|
|
|
|
err_nexthop6_group_get:
|
2019-06-18 23:12:56 +08:00
|
|
|
i = nrt6;
|
2017-08-03 19:28:28 +08:00
|
|
|
err_rt6_create:
|
2019-06-18 23:12:56 +08:00
|
|
|
for (i--; i >= 0; i--) {
|
|
|
|
fib6_entry->nrt6--;
|
|
|
|
mlxsw_sp_rt6 = list_last_entry(&fib6_entry->rt6_list,
|
|
|
|
struct mlxsw_sp_rt6, list);
|
|
|
|
list_del(&mlxsw_sp_rt6->list);
|
|
|
|
mlxsw_sp_rt6_destroy(mlxsw_sp_rt6);
|
|
|
|
}
|
2017-08-03 19:28:28 +08:00
|
|
|
kfree(fib6_entry);
|
|
|
|
return ERR_PTR(err);
|
|
|
|
}
|
|
|
|
|
|
|
|
static void mlxsw_sp_fib6_entry_destroy(struct mlxsw_sp *mlxsw_sp,
|
|
|
|
struct mlxsw_sp_fib6_entry *fib6_entry)
|
|
|
|
{
|
|
|
|
mlxsw_sp_nexthop6_group_put(mlxsw_sp, &fib6_entry->common);
|
|
|
|
mlxsw_sp_fib6_entry_rt_destroy_all(fib6_entry);
|
|
|
|
WARN_ON(fib6_entry->nrt6);
|
|
|
|
kfree(fib6_entry);
|
|
|
|
}
|
|
|
|
|
|
|
|
static struct mlxsw_sp_fib6_entry *
|
|
|
|
mlxsw_sp_fib6_entry_lookup(struct mlxsw_sp *mlxsw_sp,
|
2018-04-18 08:33:26 +08:00
|
|
|
const struct fib6_info *rt)
|
2017-08-03 19:28:28 +08:00
|
|
|
{
|
|
|
|
struct mlxsw_sp_fib6_entry *fib6_entry;
|
|
|
|
struct mlxsw_sp_fib_node *fib_node;
|
|
|
|
struct mlxsw_sp_fib *fib;
|
2019-12-27 00:41:17 +08:00
|
|
|
struct fib6_info *cmp_rt;
|
2017-08-03 19:28:28 +08:00
|
|
|
struct mlxsw_sp_vr *vr;
|
|
|
|
|
2018-04-19 06:38:59 +08:00
|
|
|
vr = mlxsw_sp_vr_find(mlxsw_sp, rt->fib6_table->tb6_id);
|
2017-08-03 19:28:28 +08:00
|
|
|
if (!vr)
|
|
|
|
return NULL;
|
|
|
|
fib = mlxsw_sp_vr_fib(vr, MLXSW_SP_L3_PROTO_IPV6);
|
|
|
|
|
2018-04-19 06:38:59 +08:00
|
|
|
fib_node = mlxsw_sp_fib_node_lookup(fib, &rt->fib6_dst.addr,
|
|
|
|
sizeof(rt->fib6_dst.addr),
|
|
|
|
rt->fib6_dst.plen);
|
2017-08-03 19:28:28 +08:00
|
|
|
if (!fib_node)
|
|
|
|
return NULL;
|
|
|
|
|
2019-12-27 00:41:17 +08:00
|
|
|
fib6_entry = container_of(fib_node->fib_entry,
|
|
|
|
struct mlxsw_sp_fib6_entry, common);
|
|
|
|
cmp_rt = mlxsw_sp_fib6_entry_rt(fib6_entry);
|
|
|
|
if (rt->fib6_table->tb6_id == cmp_rt->fib6_table->tb6_id &&
|
|
|
|
rt->fib6_metric == cmp_rt->fib6_metric &&
|
|
|
|
mlxsw_sp_fib6_entry_rt_find(fib6_entry, rt))
|
|
|
|
return fib6_entry;
|
2017-08-03 19:28:28 +08:00
|
|
|
|
|
|
|
return NULL;
|
|
|
|
}
|
|
|
|
|
2020-02-08 01:26:24 +08:00
|
|
|
static bool mlxsw_sp_fib6_allow_replace(struct mlxsw_sp_fib6_entry *fib6_entry)
|
|
|
|
{
|
|
|
|
struct mlxsw_sp_fib_node *fib_node = fib6_entry->common.fib_node;
|
|
|
|
struct mlxsw_sp_fib6_entry *fib6_replaced;
|
|
|
|
struct fib6_info *rt, *rt_replaced;
|
|
|
|
|
|
|
|
if (!fib_node->fib_entry)
|
|
|
|
return true;
|
|
|
|
|
|
|
|
fib6_replaced = container_of(fib_node->fib_entry,
|
|
|
|
struct mlxsw_sp_fib6_entry,
|
|
|
|
common);
|
|
|
|
rt = mlxsw_sp_fib6_entry_rt(fib6_entry);
|
|
|
|
rt_replaced = mlxsw_sp_fib6_entry_rt(fib6_replaced);
|
|
|
|
if (rt->fib6_table->tb6_id == RT_TABLE_MAIN &&
|
|
|
|
rt_replaced->fib6_table->tb6_id == RT_TABLE_LOCAL)
|
|
|
|
return false;
|
|
|
|
|
|
|
|
return true;
|
|
|
|
}
|
|
|
|
|
2019-12-23 21:28:19 +08:00
|
|
|
static int mlxsw_sp_router_fib6_replace(struct mlxsw_sp *mlxsw_sp,
|
|
|
|
struct fib6_info **rt_arr,
|
|
|
|
unsigned int nrt6)
|
2017-08-03 19:28:28 +08:00
|
|
|
{
|
2019-12-27 00:41:17 +08:00
|
|
|
struct mlxsw_sp_fib6_entry *fib6_entry, *fib6_replaced;
|
|
|
|
struct mlxsw_sp_fib_entry *replaced;
|
2017-08-03 19:28:28 +08:00
|
|
|
struct mlxsw_sp_fib_node *fib_node;
|
2019-06-18 23:12:54 +08:00
|
|
|
struct fib6_info *rt = rt_arr[0];
|
2017-08-03 19:28:28 +08:00
|
|
|
int err;
|
|
|
|
|
|
|
|
if (mlxsw_sp->router->aborted)
|
|
|
|
return 0;
|
|
|
|
|
2018-04-19 06:38:59 +08:00
|
|
|
if (rt->fib6_src.plen)
|
2017-08-03 19:28:30 +08:00
|
|
|
return -EINVAL;
|
|
|
|
|
2017-08-03 19:28:28 +08:00
|
|
|
if (mlxsw_sp_fib6_rt_should_ignore(rt))
|
|
|
|
return 0;
|
|
|
|
|
2018-04-19 06:38:59 +08:00
|
|
|
fib_node = mlxsw_sp_fib_node_get(mlxsw_sp, rt->fib6_table->tb6_id,
|
|
|
|
&rt->fib6_dst.addr,
|
|
|
|
sizeof(rt->fib6_dst.addr),
|
|
|
|
rt->fib6_dst.plen,
|
2017-08-03 19:28:28 +08:00
|
|
|
MLXSW_SP_L3_PROTO_IPV6);
|
|
|
|
if (IS_ERR(fib_node))
|
|
|
|
return PTR_ERR(fib_node);
|
|
|
|
|
2019-06-18 23:12:56 +08:00
|
|
|
fib6_entry = mlxsw_sp_fib6_entry_create(mlxsw_sp, fib_node, rt_arr,
|
|
|
|
nrt6);
|
2017-08-03 19:28:28 +08:00
|
|
|
if (IS_ERR(fib6_entry)) {
|
|
|
|
err = PTR_ERR(fib6_entry);
|
|
|
|
goto err_fib6_entry_create;
|
|
|
|
}
|
|
|
|
|
2020-02-08 01:26:24 +08:00
|
|
|
if (!mlxsw_sp_fib6_allow_replace(fib6_entry)) {
|
|
|
|
mlxsw_sp_fib6_entry_destroy(mlxsw_sp, fib6_entry);
|
|
|
|
mlxsw_sp_fib_node_put(mlxsw_sp, fib_node);
|
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
2019-12-27 00:41:17 +08:00
|
|
|
replaced = fib_node->fib_entry;
|
2019-12-27 00:41:16 +08:00
|
|
|
err = mlxsw_sp_fib_node_entry_link(mlxsw_sp, &fib6_entry->common);
|
2017-08-03 19:28:28 +08:00
|
|
|
if (err)
|
2019-12-27 00:41:16 +08:00
|
|
|
goto err_fib_node_entry_link;
|
2017-08-03 19:28:28 +08:00
|
|
|
|
2019-12-27 00:41:17 +08:00
|
|
|
/* Nothing to replace */
|
|
|
|
if (!replaced)
|
|
|
|
return 0;
|
|
|
|
|
2020-01-14 19:23:14 +08:00
|
|
|
mlxsw_sp_fib_entry_hw_flags_clear(mlxsw_sp, replaced);
|
2019-12-27 00:41:17 +08:00
|
|
|
fib6_replaced = container_of(replaced, struct mlxsw_sp_fib6_entry,
|
|
|
|
common);
|
|
|
|
mlxsw_sp_fib6_entry_destroy(mlxsw_sp, fib6_replaced);
|
2017-08-03 19:28:29 +08:00
|
|
|
|
2017-08-03 19:28:28 +08:00
|
|
|
return 0;
|
|
|
|
|
2019-12-27 00:41:16 +08:00
|
|
|
err_fib_node_entry_link:
|
2019-12-27 00:41:17 +08:00
|
|
|
fib_node->fib_entry = replaced;
|
2017-08-03 19:28:28 +08:00
|
|
|
mlxsw_sp_fib6_entry_destroy(mlxsw_sp, fib6_entry);
|
|
|
|
err_fib6_entry_create:
|
2019-12-23 21:28:19 +08:00
|
|
|
mlxsw_sp_fib_node_put(mlxsw_sp, fib_node);
|
|
|
|
return err;
|
|
|
|
}
|
|
|
|
|
|
|
|
static int mlxsw_sp_router_fib6_append(struct mlxsw_sp *mlxsw_sp,
|
|
|
|
struct fib6_info **rt_arr,
|
|
|
|
unsigned int nrt6)
|
|
|
|
{
|
|
|
|
struct mlxsw_sp_fib6_entry *fib6_entry;
|
|
|
|
struct mlxsw_sp_fib_node *fib_node;
|
|
|
|
struct fib6_info *rt = rt_arr[0];
|
|
|
|
int err;
|
|
|
|
|
|
|
|
if (mlxsw_sp->router->aborted)
|
|
|
|
return 0;
|
|
|
|
|
|
|
|
if (rt->fib6_src.plen)
|
|
|
|
return -EINVAL;
|
|
|
|
|
|
|
|
if (mlxsw_sp_fib6_rt_should_ignore(rt))
|
|
|
|
return 0;
|
|
|
|
|
|
|
|
fib_node = mlxsw_sp_fib_node_get(mlxsw_sp, rt->fib6_table->tb6_id,
|
|
|
|
&rt->fib6_dst.addr,
|
|
|
|
sizeof(rt->fib6_dst.addr),
|
|
|
|
rt->fib6_dst.plen,
|
|
|
|
MLXSW_SP_L3_PROTO_IPV6);
|
|
|
|
if (IS_ERR(fib_node))
|
|
|
|
return PTR_ERR(fib_node);
|
|
|
|
|
2019-12-27 00:41:17 +08:00
|
|
|
if (WARN_ON_ONCE(!fib_node->fib_entry)) {
|
2019-12-23 21:28:19 +08:00
|
|
|
mlxsw_sp_fib_node_put(mlxsw_sp, fib_node);
|
|
|
|
return -EINVAL;
|
|
|
|
}
|
|
|
|
|
2019-12-27 00:41:17 +08:00
|
|
|
fib6_entry = container_of(fib_node->fib_entry,
|
|
|
|
struct mlxsw_sp_fib6_entry, common);
|
2019-12-23 21:28:19 +08:00
|
|
|
err = mlxsw_sp_fib6_entry_nexthop_add(mlxsw_sp, fib6_entry, rt_arr,
|
|
|
|
nrt6);
|
|
|
|
if (err)
|
|
|
|
goto err_fib6_entry_nexthop_add;
|
|
|
|
|
|
|
|
return 0;
|
|
|
|
|
2017-08-03 19:28:28 +08:00
|
|
|
err_fib6_entry_nexthop_add:
|
|
|
|
mlxsw_sp_fib_node_put(mlxsw_sp, fib_node);
|
|
|
|
return err;
|
|
|
|
}
|
|
|
|
|
|
|
|
static void mlxsw_sp_router_fib6_del(struct mlxsw_sp *mlxsw_sp,
|
2019-06-18 23:12:54 +08:00
|
|
|
struct fib6_info **rt_arr,
|
|
|
|
unsigned int nrt6)
|
2017-08-03 19:28:28 +08:00
|
|
|
{
|
|
|
|
struct mlxsw_sp_fib6_entry *fib6_entry;
|
|
|
|
struct mlxsw_sp_fib_node *fib_node;
|
2019-06-18 23:12:54 +08:00
|
|
|
struct fib6_info *rt = rt_arr[0];
|
2017-08-03 19:28:28 +08:00
|
|
|
|
|
|
|
if (mlxsw_sp->router->aborted)
|
|
|
|
return;
|
|
|
|
|
|
|
|
if (mlxsw_sp_fib6_rt_should_ignore(rt))
|
|
|
|
return;
|
|
|
|
|
2019-12-09 14:55:20 +08:00
|
|
|
/* Multipath routes are first added to the FIB trie and only then
|
|
|
|
* notified. If we vetoed the addition, we will get a delete
|
|
|
|
* notification for a route we do not have. Therefore, do not warn if
|
|
|
|
* route was not found.
|
|
|
|
*/
|
2017-08-03 19:28:28 +08:00
|
|
|
fib6_entry = mlxsw_sp_fib6_entry_lookup(mlxsw_sp, rt);
|
2019-12-09 14:55:20 +08:00
|
|
|
if (!fib6_entry)
|
2017-08-03 19:28:28 +08:00
|
|
|
return;
|
|
|
|
|
2019-06-18 23:12:55 +08:00
|
|
|
/* If not all the nexthops are deleted, then only reduce the nexthop
|
|
|
|
* group.
|
2017-08-03 19:28:28 +08:00
|
|
|
*/
|
2019-06-18 23:12:55 +08:00
|
|
|
if (nrt6 != fib6_entry->nrt6) {
|
|
|
|
mlxsw_sp_fib6_entry_nexthop_del(mlxsw_sp, fib6_entry, rt_arr,
|
|
|
|
nrt6);
|
2017-08-03 19:28:28 +08:00
|
|
|
return;
|
|
|
|
}
|
|
|
|
|
|
|
|
fib_node = fib6_entry->common.fib_node;
|
|
|
|
|
2019-12-27 00:41:16 +08:00
|
|
|
mlxsw_sp_fib_node_entry_unlink(mlxsw_sp, &fib6_entry->common);
|
2017-08-03 19:28:28 +08:00
|
|
|
mlxsw_sp_fib6_entry_destroy(mlxsw_sp, fib6_entry);
|
|
|
|
mlxsw_sp_fib_node_put(mlxsw_sp, fib_node);
|
|
|
|
}
|
|
|
|
|
2017-07-18 16:10:25 +08:00
|
|
|
static int __mlxsw_sp_router_set_abort_trap(struct mlxsw_sp *mlxsw_sp,
|
|
|
|
enum mlxsw_reg_ralxx_protocol proto,
|
|
|
|
u8 tree_id)
|
2016-09-26 18:52:31 +08:00
|
|
|
{
|
|
|
|
char ralta_pl[MLXSW_REG_RALTA_LEN];
|
|
|
|
char ralst_pl[MLXSW_REG_RALST_LEN];
|
2017-03-10 15:53:43 +08:00
|
|
|
int i, err;
|
2016-09-26 18:52:31 +08:00
|
|
|
|
2017-07-18 16:10:25 +08:00
|
|
|
mlxsw_reg_ralta_pack(ralta_pl, true, proto, tree_id);
|
2016-09-26 18:52:31 +08:00
|
|
|
err = mlxsw_reg_write(mlxsw_sp->core, MLXSW_REG(ralta), ralta_pl);
|
|
|
|
if (err)
|
|
|
|
return err;
|
|
|
|
|
2017-07-18 16:10:25 +08:00
|
|
|
mlxsw_reg_ralst_pack(ralst_pl, 0xff, tree_id);
|
2016-09-26 18:52:31 +08:00
|
|
|
err = mlxsw_reg_write(mlxsw_sp->core, MLXSW_REG(ralst), ralst_pl);
|
|
|
|
if (err)
|
|
|
|
return err;
|
|
|
|
|
2017-03-10 15:53:43 +08:00
|
|
|
for (i = 0; i < MLXSW_CORE_RES_GET(mlxsw_sp->core, MAX_VRS); i++) {
|
2017-05-17 01:38:25 +08:00
|
|
|
struct mlxsw_sp_vr *vr = &mlxsw_sp->router->vrs[i];
|
2017-03-10 15:53:43 +08:00
|
|
|
char raltb_pl[MLXSW_REG_RALTB_LEN];
|
|
|
|
char ralue_pl[MLXSW_REG_RALUE_LEN];
|
2016-09-26 18:52:31 +08:00
|
|
|
|
2017-07-18 16:10:25 +08:00
|
|
|
mlxsw_reg_raltb_pack(raltb_pl, vr->id, proto, tree_id);
|
2017-03-10 15:53:43 +08:00
|
|
|
err = mlxsw_reg_write(mlxsw_sp->core, MLXSW_REG(raltb),
|
|
|
|
raltb_pl);
|
|
|
|
if (err)
|
|
|
|
return err;
|
|
|
|
|
2017-07-18 16:10:25 +08:00
|
|
|
mlxsw_reg_ralue_pack(ralue_pl, proto,
|
|
|
|
MLXSW_REG_RALUE_OP_WRITE_WRITE, vr->id, 0);
|
2017-03-10 15:53:43 +08:00
|
|
|
mlxsw_reg_ralue_act_ip2me_pack(ralue_pl);
|
|
|
|
err = mlxsw_reg_write(mlxsw_sp->core, MLXSW_REG(ralue),
|
|
|
|
ralue_pl);
|
|
|
|
if (err)
|
|
|
|
return err;
|
|
|
|
}
|
|
|
|
|
|
|
|
return 0;
|
2016-09-26 18:52:31 +08:00
|
|
|
}
|
|
|
|
|
2018-03-26 20:01:42 +08:00
|
|
|
static struct mlxsw_sp_mr_table *
|
|
|
|
mlxsw_sp_router_fibmr_family_to_table(struct mlxsw_sp_vr *vr, int family)
|
|
|
|
{
|
2018-03-26 20:01:44 +08:00
|
|
|
if (family == RTNL_FAMILY_IPMR)
|
2018-03-26 20:01:42 +08:00
|
|
|
return vr->mr_table[MLXSW_SP_L3_PROTO_IPV4];
|
2018-03-26 20:01:44 +08:00
|
|
|
else
|
|
|
|
return vr->mr_table[MLXSW_SP_L3_PROTO_IPV6];
|
2018-03-26 20:01:42 +08:00
|
|
|
}
|
|
|
|
|
2017-09-27 14:23:20 +08:00
|
|
|
static int mlxsw_sp_router_fibmr_add(struct mlxsw_sp *mlxsw_sp,
|
|
|
|
struct mfc_entry_notifier_info *men_info,
|
|
|
|
bool replace)
|
|
|
|
{
|
2018-03-26 20:01:42 +08:00
|
|
|
struct mlxsw_sp_mr_table *mrt;
|
2017-09-27 14:23:20 +08:00
|
|
|
struct mlxsw_sp_vr *vr;
|
|
|
|
|
|
|
|
if (mlxsw_sp->router->aborted)
|
|
|
|
return 0;
|
|
|
|
|
2017-10-19 00:56:56 +08:00
|
|
|
vr = mlxsw_sp_vr_get(mlxsw_sp, men_info->tb_id, NULL);
|
2017-09-27 14:23:20 +08:00
|
|
|
if (IS_ERR(vr))
|
|
|
|
return PTR_ERR(vr);
|
|
|
|
|
2018-03-26 20:01:42 +08:00
|
|
|
mrt = mlxsw_sp_router_fibmr_family_to_table(vr, men_info->info.family);
|
|
|
|
return mlxsw_sp_mr_route_add(mrt, men_info->mfc, replace);
|
2017-09-27 14:23:20 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
static void mlxsw_sp_router_fibmr_del(struct mlxsw_sp *mlxsw_sp,
|
|
|
|
struct mfc_entry_notifier_info *men_info)
|
|
|
|
{
|
2018-03-26 20:01:42 +08:00
|
|
|
struct mlxsw_sp_mr_table *mrt;
|
2017-09-27 14:23:20 +08:00
|
|
|
struct mlxsw_sp_vr *vr;
|
|
|
|
|
|
|
|
if (mlxsw_sp->router->aborted)
|
|
|
|
return;
|
|
|
|
|
|
|
|
vr = mlxsw_sp_vr_find(mlxsw_sp, men_info->tb_id);
|
|
|
|
if (WARN_ON(!vr))
|
|
|
|
return;
|
|
|
|
|
2018-03-26 20:01:42 +08:00
|
|
|
mrt = mlxsw_sp_router_fibmr_family_to_table(vr, men_info->info.family);
|
|
|
|
mlxsw_sp_mr_route_del(mrt, men_info->mfc);
|
2018-01-22 16:17:42 +08:00
|
|
|
mlxsw_sp_vr_put(mlxsw_sp, vr);
|
2017-09-27 14:23:20 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
static int
|
|
|
|
mlxsw_sp_router_fibmr_vif_add(struct mlxsw_sp *mlxsw_sp,
|
|
|
|
struct vif_entry_notifier_info *ven_info)
|
|
|
|
{
|
2018-03-26 20:01:42 +08:00
|
|
|
struct mlxsw_sp_mr_table *mrt;
|
2017-09-27 14:23:20 +08:00
|
|
|
struct mlxsw_sp_rif *rif;
|
|
|
|
struct mlxsw_sp_vr *vr;
|
|
|
|
|
|
|
|
if (mlxsw_sp->router->aborted)
|
|
|
|
return 0;
|
|
|
|
|
2017-10-19 00:56:56 +08:00
|
|
|
vr = mlxsw_sp_vr_get(mlxsw_sp, ven_info->tb_id, NULL);
|
2017-09-27 14:23:20 +08:00
|
|
|
if (IS_ERR(vr))
|
|
|
|
return PTR_ERR(vr);
|
|
|
|
|
2018-03-26 20:01:42 +08:00
|
|
|
mrt = mlxsw_sp_router_fibmr_family_to_table(vr, ven_info->info.family);
|
2017-09-27 14:23:20 +08:00
|
|
|
rif = mlxsw_sp_rif_find_by_dev(mlxsw_sp, ven_info->dev);
|
2018-03-26 20:01:42 +08:00
|
|
|
return mlxsw_sp_mr_vif_add(mrt, ven_info->dev,
|
2017-09-27 14:23:20 +08:00
|
|
|
ven_info->vif_index,
|
|
|
|
ven_info->vif_flags, rif);
|
|
|
|
}
|
|
|
|
|
|
|
|
static void
|
|
|
|
mlxsw_sp_router_fibmr_vif_del(struct mlxsw_sp *mlxsw_sp,
|
|
|
|
struct vif_entry_notifier_info *ven_info)
|
|
|
|
{
|
2018-03-26 20:01:42 +08:00
|
|
|
struct mlxsw_sp_mr_table *mrt;
|
2017-09-27 14:23:20 +08:00
|
|
|
struct mlxsw_sp_vr *vr;
|
|
|
|
|
|
|
|
if (mlxsw_sp->router->aborted)
|
|
|
|
return;
|
|
|
|
|
|
|
|
vr = mlxsw_sp_vr_find(mlxsw_sp, ven_info->tb_id);
|
|
|
|
if (WARN_ON(!vr))
|
|
|
|
return;
|
|
|
|
|
2018-03-26 20:01:42 +08:00
|
|
|
mrt = mlxsw_sp_router_fibmr_family_to_table(vr, ven_info->info.family);
|
|
|
|
mlxsw_sp_mr_vif_del(mrt, ven_info->vif_index);
|
2018-01-22 16:17:42 +08:00
|
|
|
mlxsw_sp_vr_put(mlxsw_sp, vr);
|
2017-09-27 14:23:20 +08:00
|
|
|
}
|
|
|
|
|
2017-07-18 16:10:25 +08:00
|
|
|
static int mlxsw_sp_router_set_abort_trap(struct mlxsw_sp *mlxsw_sp)
|
|
|
|
{
|
|
|
|
enum mlxsw_reg_ralxx_protocol proto = MLXSW_REG_RALXX_PROTOCOL_IPV4;
|
|
|
|
int err;
|
|
|
|
|
|
|
|
err = __mlxsw_sp_router_set_abort_trap(mlxsw_sp, proto,
|
|
|
|
MLXSW_SP_LPM_TREE_MIN);
|
|
|
|
if (err)
|
|
|
|
return err;
|
|
|
|
|
2017-09-27 14:23:20 +08:00
|
|
|
/* The multicast router code does not need an abort trap as by default,
|
|
|
|
* packets that don't match any routes are trapped to the CPU.
|
|
|
|
*/
|
|
|
|
|
2017-07-18 16:10:25 +08:00
|
|
|
proto = MLXSW_REG_RALXX_PROTOCOL_IPV6;
|
|
|
|
return __mlxsw_sp_router_set_abort_trap(mlxsw_sp, proto,
|
|
|
|
MLXSW_SP_LPM_TREE_MIN + 1);
|
|
|
|
}
|
|
|
|
|
mlxsw: spectrum_router: Correctly handle identical routes
In the device, routes are indexed in a routing table based on the prefix
and its length. This is in contrast to the kernel's FIB where several
FIB aliases can exist with these parameters being identical. In such
cases, the routes will be sorted by table ID (LOCAL first, then MAIN),
TOS and finally priority (metric).
During lookup, these routes will be evaluated in order. In case the
packet's TOS field is non-zero and a FIB alias with a matching TOS is
found, then it's selected. Otherwise, the lookup defaults to the route
with TOS 0 (if it exists). However, if the requested scope is narrower
than the one found, then the lookup continues.
To best reflect the kernel's datapath we should take the above into
account. Given a prefix and its length, the reflected route will always
be the first one in the FIB alias list. However, if the route has a
non-zero TOS then its action will be converted to trap instead of
forward, since we currently don't support TOS-based routing. If this
turns out to be a real issue, we can add support for that using
policy-based switching.
The route's scope can be effectively ignored as any packet being routed
by the device would've been looked-up using the widest scope (UNIVERSE).
To achieve that we need to do two changes. Firstly, we need to create
another struct (FIB node) that will hold the list of FIB entries sharing
the same prefix and length. This struct will be hashed using these two
parameters.
Secondly, we need to change the route reflection to match the above
logic, so that the first FIB entry in the list will be programmed into
the device while the rest will remain in the driver's cache in case of
subsequent changes.
Signed-off-by: Ido Schimmel <idosch@mellanox.com>
Signed-off-by: Jiri Pirko <jiri@mellanox.com>
Signed-off-by: David S. Miller <davem@davemloft.net>
2017-02-09 17:28:42 +08:00
|
|
|
static void mlxsw_sp_fib4_node_flush(struct mlxsw_sp *mlxsw_sp,
|
|
|
|
struct mlxsw_sp_fib_node *fib_node)
|
|
|
|
{
|
2019-12-27 00:41:17 +08:00
|
|
|
struct mlxsw_sp_fib4_entry *fib4_entry;
|
mlxsw: spectrum_router: Correctly handle identical routes
In the device, routes are indexed in a routing table based on the prefix
and its length. This is in contrast to the kernel's FIB where several
FIB aliases can exist with these parameters being identical. In such
cases, the routes will be sorted by table ID (LOCAL first, then MAIN),
TOS and finally priority (metric).
During lookup, these routes will be evaluated in order. In case the
packet's TOS field is non-zero and a FIB alias with a matching TOS is
found, then it's selected. Otherwise, the lookup defaults to the route
with TOS 0 (if it exists). However, if the requested scope is narrower
than the one found, then the lookup continues.
To best reflect the kernel's datapath we should take the above into
account. Given a prefix and its length, the reflected route will always
be the first one in the FIB alias list. However, if the route has a
non-zero TOS then its action will be converted to trap instead of
forward, since we currently don't support TOS-based routing. If this
turns out to be a real issue, we can add support for that using
policy-based switching.
The route's scope can be effectively ignored as any packet being routed
by the device would've been looked-up using the widest scope (UNIVERSE).
To achieve that we need to do two changes. Firstly, we need to create
another struct (FIB node) that will hold the list of FIB entries sharing
the same prefix and length. This struct will be hashed using these two
parameters.
Secondly, we need to change the route reflection to match the above
logic, so that the first FIB entry in the list will be programmed into
the device while the rest will remain in the driver's cache in case of
subsequent changes.
Signed-off-by: Ido Schimmel <idosch@mellanox.com>
Signed-off-by: Jiri Pirko <jiri@mellanox.com>
Signed-off-by: David S. Miller <davem@davemloft.net>
2017-02-09 17:28:42 +08:00
|
|
|
|
2019-12-27 00:41:17 +08:00
|
|
|
fib4_entry = container_of(fib_node->fib_entry,
|
|
|
|
struct mlxsw_sp_fib4_entry, common);
|
|
|
|
mlxsw_sp_fib_node_entry_unlink(mlxsw_sp, fib_node->fib_entry);
|
|
|
|
mlxsw_sp_fib4_entry_destroy(mlxsw_sp, fib4_entry);
|
|
|
|
mlxsw_sp_fib_node_put(mlxsw_sp, fib_node);
|
mlxsw: spectrum_router: Correctly handle identical routes
In the device, routes are indexed in a routing table based on the prefix
and its length. This is in contrast to the kernel's FIB where several
FIB aliases can exist with these parameters being identical. In such
cases, the routes will be sorted by table ID (LOCAL first, then MAIN),
TOS and finally priority (metric).
During lookup, these routes will be evaluated in order. In case the
packet's TOS field is non-zero and a FIB alias with a matching TOS is
found, then it's selected. Otherwise, the lookup defaults to the route
with TOS 0 (if it exists). However, if the requested scope is narrower
than the one found, then the lookup continues.
To best reflect the kernel's datapath we should take the above into
account. Given a prefix and its length, the reflected route will always
be the first one in the FIB alias list. However, if the route has a
non-zero TOS then its action will be converted to trap instead of
forward, since we currently don't support TOS-based routing. If this
turns out to be a real issue, we can add support for that using
policy-based switching.
The route's scope can be effectively ignored as any packet being routed
by the device would've been looked-up using the widest scope (UNIVERSE).
To achieve that we need to do two changes. Firstly, we need to create
another struct (FIB node) that will hold the list of FIB entries sharing
the same prefix and length. This struct will be hashed using these two
parameters.
Secondly, we need to change the route reflection to match the above
logic, so that the first FIB entry in the list will be programmed into
the device while the rest will remain in the driver's cache in case of
subsequent changes.
Signed-off-by: Ido Schimmel <idosch@mellanox.com>
Signed-off-by: Jiri Pirko <jiri@mellanox.com>
Signed-off-by: David S. Miller <davem@davemloft.net>
2017-02-09 17:28:42 +08:00
|
|
|
}
|
|
|
|
|
2017-08-03 19:28:28 +08:00
|
|
|
static void mlxsw_sp_fib6_node_flush(struct mlxsw_sp *mlxsw_sp,
|
|
|
|
struct mlxsw_sp_fib_node *fib_node)
|
|
|
|
{
|
2019-12-27 00:41:17 +08:00
|
|
|
struct mlxsw_sp_fib6_entry *fib6_entry;
|
2017-08-03 19:28:28 +08:00
|
|
|
|
2019-12-27 00:41:17 +08:00
|
|
|
fib6_entry = container_of(fib_node->fib_entry,
|
|
|
|
struct mlxsw_sp_fib6_entry, common);
|
|
|
|
mlxsw_sp_fib_node_entry_unlink(mlxsw_sp, fib_node->fib_entry);
|
|
|
|
mlxsw_sp_fib6_entry_destroy(mlxsw_sp, fib6_entry);
|
|
|
|
mlxsw_sp_fib_node_put(mlxsw_sp, fib_node);
|
2017-08-03 19:28:28 +08:00
|
|
|
}
|
|
|
|
|
mlxsw: spectrum_router: Correctly handle identical routes
In the device, routes are indexed in a routing table based on the prefix
and its length. This is in contrast to the kernel's FIB where several
FIB aliases can exist with these parameters being identical. In such
cases, the routes will be sorted by table ID (LOCAL first, then MAIN),
TOS and finally priority (metric).
During lookup, these routes will be evaluated in order. In case the
packet's TOS field is non-zero and a FIB alias with a matching TOS is
found, then it's selected. Otherwise, the lookup defaults to the route
with TOS 0 (if it exists). However, if the requested scope is narrower
than the one found, then the lookup continues.
To best reflect the kernel's datapath we should take the above into
account. Given a prefix and its length, the reflected route will always
be the first one in the FIB alias list. However, if the route has a
non-zero TOS then its action will be converted to trap instead of
forward, since we currently don't support TOS-based routing. If this
turns out to be a real issue, we can add support for that using
policy-based switching.
The route's scope can be effectively ignored as any packet being routed
by the device would've been looked-up using the widest scope (UNIVERSE).
To achieve that we need to do two changes. Firstly, we need to create
another struct (FIB node) that will hold the list of FIB entries sharing
the same prefix and length. This struct will be hashed using these two
parameters.
Secondly, we need to change the route reflection to match the above
logic, so that the first FIB entry in the list will be programmed into
the device while the rest will remain in the driver's cache in case of
subsequent changes.
Signed-off-by: Ido Schimmel <idosch@mellanox.com>
Signed-off-by: Jiri Pirko <jiri@mellanox.com>
Signed-off-by: David S. Miller <davem@davemloft.net>
2017-02-09 17:28:42 +08:00
|
|
|
static void mlxsw_sp_fib_node_flush(struct mlxsw_sp *mlxsw_sp,
|
|
|
|
struct mlxsw_sp_fib_node *fib_node)
|
|
|
|
{
|
2017-03-10 15:53:41 +08:00
|
|
|
switch (fib_node->fib->proto) {
|
mlxsw: spectrum_router: Correctly handle identical routes
In the device, routes are indexed in a routing table based on the prefix
and its length. This is in contrast to the kernel's FIB where several
FIB aliases can exist with these parameters being identical. In such
cases, the routes will be sorted by table ID (LOCAL first, then MAIN),
TOS and finally priority (metric).
During lookup, these routes will be evaluated in order. In case the
packet's TOS field is non-zero and a FIB alias with a matching TOS is
found, then it's selected. Otherwise, the lookup defaults to the route
with TOS 0 (if it exists). However, if the requested scope is narrower
than the one found, then the lookup continues.
To best reflect the kernel's datapath we should take the above into
account. Given a prefix and its length, the reflected route will always
be the first one in the FIB alias list. However, if the route has a
non-zero TOS then its action will be converted to trap instead of
forward, since we currently don't support TOS-based routing. If this
turns out to be a real issue, we can add support for that using
policy-based switching.
The route's scope can be effectively ignored as any packet being routed
by the device would've been looked-up using the widest scope (UNIVERSE).
To achieve that we need to do two changes. Firstly, we need to create
another struct (FIB node) that will hold the list of FIB entries sharing
the same prefix and length. This struct will be hashed using these two
parameters.
Secondly, we need to change the route reflection to match the above
logic, so that the first FIB entry in the list will be programmed into
the device while the rest will remain in the driver's cache in case of
subsequent changes.
Signed-off-by: Ido Schimmel <idosch@mellanox.com>
Signed-off-by: Jiri Pirko <jiri@mellanox.com>
Signed-off-by: David S. Miller <davem@davemloft.net>
2017-02-09 17:28:42 +08:00
|
|
|
case MLXSW_SP_L3_PROTO_IPV4:
|
|
|
|
mlxsw_sp_fib4_node_flush(mlxsw_sp, fib_node);
|
|
|
|
break;
|
|
|
|
case MLXSW_SP_L3_PROTO_IPV6:
|
2017-08-03 19:28:28 +08:00
|
|
|
mlxsw_sp_fib6_node_flush(mlxsw_sp, fib_node);
|
mlxsw: spectrum_router: Correctly handle identical routes
In the device, routes are indexed in a routing table based on the prefix
and its length. This is in contrast to the kernel's FIB where several
FIB aliases can exist with these parameters being identical. In such
cases, the routes will be sorted by table ID (LOCAL first, then MAIN),
TOS and finally priority (metric).
During lookup, these routes will be evaluated in order. In case the
packet's TOS field is non-zero and a FIB alias with a matching TOS is
found, then it's selected. Otherwise, the lookup defaults to the route
with TOS 0 (if it exists). However, if the requested scope is narrower
than the one found, then the lookup continues.
To best reflect the kernel's datapath we should take the above into
account. Given a prefix and its length, the reflected route will always
be the first one in the FIB alias list. However, if the route has a
non-zero TOS then its action will be converted to trap instead of
forward, since we currently don't support TOS-based routing. If this
turns out to be a real issue, we can add support for that using
policy-based switching.
The route's scope can be effectively ignored as any packet being routed
by the device would've been looked-up using the widest scope (UNIVERSE).
To achieve that we need to do two changes. Firstly, we need to create
another struct (FIB node) that will hold the list of FIB entries sharing
the same prefix and length. This struct will be hashed using these two
parameters.
Secondly, we need to change the route reflection to match the above
logic, so that the first FIB entry in the list will be programmed into
the device while the rest will remain in the driver's cache in case of
subsequent changes.
Signed-off-by: Ido Schimmel <idosch@mellanox.com>
Signed-off-by: Jiri Pirko <jiri@mellanox.com>
Signed-off-by: David S. Miller <davem@davemloft.net>
2017-02-09 17:28:42 +08:00
|
|
|
break;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2017-03-10 15:53:41 +08:00
|
|
|
static void mlxsw_sp_vr_fib_flush(struct mlxsw_sp *mlxsw_sp,
|
|
|
|
struct mlxsw_sp_vr *vr,
|
|
|
|
enum mlxsw_sp_l3proto proto)
|
2016-09-26 18:52:31 +08:00
|
|
|
{
|
2017-03-10 15:53:41 +08:00
|
|
|
struct mlxsw_sp_fib *fib = mlxsw_sp_vr_fib(vr, proto);
|
mlxsw: spectrum_router: Correctly handle identical routes
In the device, routes are indexed in a routing table based on the prefix
and its length. This is in contrast to the kernel's FIB where several
FIB aliases can exist with these parameters being identical. In such
cases, the routes will be sorted by table ID (LOCAL first, then MAIN),
TOS and finally priority (metric).
During lookup, these routes will be evaluated in order. In case the
packet's TOS field is non-zero and a FIB alias with a matching TOS is
found, then it's selected. Otherwise, the lookup defaults to the route
with TOS 0 (if it exists). However, if the requested scope is narrower
than the one found, then the lookup continues.
To best reflect the kernel's datapath we should take the above into
account. Given a prefix and its length, the reflected route will always
be the first one in the FIB alias list. However, if the route has a
non-zero TOS then its action will be converted to trap instead of
forward, since we currently don't support TOS-based routing. If this
turns out to be a real issue, we can add support for that using
policy-based switching.
The route's scope can be effectively ignored as any packet being routed
by the device would've been looked-up using the widest scope (UNIVERSE).
To achieve that we need to do two changes. Firstly, we need to create
another struct (FIB node) that will hold the list of FIB entries sharing
the same prefix and length. This struct will be hashed using these two
parameters.
Secondly, we need to change the route reflection to match the above
logic, so that the first FIB entry in the list will be programmed into
the device while the rest will remain in the driver's cache in case of
subsequent changes.
Signed-off-by: Ido Schimmel <idosch@mellanox.com>
Signed-off-by: Jiri Pirko <jiri@mellanox.com>
Signed-off-by: David S. Miller <davem@davemloft.net>
2017-02-09 17:28:42 +08:00
|
|
|
struct mlxsw_sp_fib_node *fib_node, *tmp;
|
2017-03-10 15:53:41 +08:00
|
|
|
|
|
|
|
list_for_each_entry_safe(fib_node, tmp, &fib->node_list, list) {
|
|
|
|
bool do_break = &tmp->list == &fib->node_list;
|
|
|
|
|
|
|
|
mlxsw_sp_fib_node_flush(mlxsw_sp, fib_node);
|
|
|
|
if (do_break)
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
static void mlxsw_sp_router_fib_flush(struct mlxsw_sp *mlxsw_sp)
|
|
|
|
{
|
2018-03-26 20:01:40 +08:00
|
|
|
int i, j;
|
2016-09-26 18:52:31 +08:00
|
|
|
|
2016-10-21 22:07:23 +08:00
|
|
|
for (i = 0; i < MLXSW_CORE_RES_GET(mlxsw_sp->core, MAX_VRS); i++) {
|
2017-05-17 01:38:25 +08:00
|
|
|
struct mlxsw_sp_vr *vr = &mlxsw_sp->router->vrs[i];
|
2016-11-14 18:26:32 +08:00
|
|
|
|
2017-03-10 15:53:41 +08:00
|
|
|
if (!mlxsw_sp_vr_is_used(vr))
|
2016-09-26 18:52:31 +08:00
|
|
|
continue;
|
2017-09-27 14:23:20 +08:00
|
|
|
|
2018-03-26 20:01:40 +08:00
|
|
|
for (j = 0; j < MLXSW_SP_L3_PROTO_MAX; j++)
|
|
|
|
mlxsw_sp_mr_table_flush(vr->mr_table[j]);
|
2017-03-10 15:53:41 +08:00
|
|
|
mlxsw_sp_vr_fib_flush(mlxsw_sp, vr, MLXSW_SP_L3_PROTO_IPV4);
|
2017-07-18 16:10:22 +08:00
|
|
|
|
|
|
|
/* If virtual router was only used for IPv4, then it's no
|
|
|
|
* longer used.
|
|
|
|
*/
|
|
|
|
if (!mlxsw_sp_vr_is_used(vr))
|
|
|
|
continue;
|
|
|
|
mlxsw_sp_vr_fib_flush(mlxsw_sp, vr, MLXSW_SP_L3_PROTO_IPV6);
|
2016-09-26 18:52:31 +08:00
|
|
|
}
|
2019-11-14 17:54:19 +08:00
|
|
|
|
|
|
|
/* After flushing all the routes, it is not possible anyone is still
|
|
|
|
* using the adjacency index that is discarding packets, so free it in
|
|
|
|
* case it was allocated.
|
|
|
|
*/
|
|
|
|
if (!mlxsw_sp->router->adj_discard_index_valid)
|
|
|
|
return;
|
|
|
|
mlxsw_sp_kvdl_free(mlxsw_sp, MLXSW_SP_KVDL_ENTRY_TYPE_ADJ, 1,
|
|
|
|
mlxsw_sp->router->adj_discard_index);
|
|
|
|
mlxsw_sp->router->adj_discard_index_valid = false;
|
2016-11-14 18:26:32 +08:00
|
|
|
}
|
|
|
|
|
2017-07-18 16:10:25 +08:00
|
|
|
static void mlxsw_sp_router_fib_abort(struct mlxsw_sp *mlxsw_sp)
|
2016-11-14 18:26:32 +08:00
|
|
|
{
|
|
|
|
int err;
|
|
|
|
|
2017-05-17 01:38:25 +08:00
|
|
|
if (mlxsw_sp->router->aborted)
|
2016-11-16 16:51:58 +08:00
|
|
|
return;
|
|
|
|
dev_warn(mlxsw_sp->bus_info->dev, "FIB abort triggered. Note that FIB entries are no longer being offloaded to this device.\n");
|
2016-11-14 18:26:32 +08:00
|
|
|
mlxsw_sp_router_fib_flush(mlxsw_sp);
|
2017-05-17 01:38:25 +08:00
|
|
|
mlxsw_sp->router->aborted = true;
|
2016-09-26 18:52:31 +08:00
|
|
|
err = mlxsw_sp_router_set_abort_trap(mlxsw_sp);
|
|
|
|
if (err)
|
|
|
|
dev_warn(mlxsw_sp->bus_info->dev, "Failed to set abort trap.\n");
|
|
|
|
}
|
|
|
|
|
2019-06-18 23:12:52 +08:00
|
|
|
/* IPv6 part of a deferred FIB event: the routes the event refers to.
 *
 * @rt_arr: heap-allocated array of route pointers; slot 0 holds the notified
 *          route, the following slots its siblings. A reference is held on
 *          every stored route.
 * @nrt6:   number of entries in @rt_arr.
 */
struct mlxsw_sp_fib6_event_work {
	struct fib6_info **rt_arr;
	unsigned int nrt6;
};
|
|
|
|
|
2016-12-03 23:45:01 +08:00
|
|
|
struct mlxsw_sp_fib_event_work {
|
2017-02-06 23:20:10 +08:00
|
|
|
struct work_struct work;
|
mlxsw: spectrum_router: Reflect nexthop status changes
When a packet hits a multipath route in the device's routing table, a
hash is computed over its headers, which is then used to select the
appropriate nexthop from the device's adjacency table.
There are situations in which the kernel removes a nexthop from a
multipath route (e.g., no carrier) and the device should do the same.
Upon the reception of NH_{ADD,DEL} events, add or remove a nexthop from
the device's adjacency table and refresh all the routes using the
nexthop group. If all the nexthops of a multipath route are invalid,
then any packet hitting the route would be trapped to the CPU for
forwarding.
If all the nexthops are DEAD, then the kernel would remove the route
entirely. On the other hand, if all the nexthops are merely LINKDOWN,
then the kernel would keep the route and forward any incoming packet
using a different route.
While the last case might sound like a problem, it's expected that a
routing daemon running in user space would remove such a route from the
FIB as it's dumped with the DEAD flag set.
Signed-off-by: Ido Schimmel <idosch@mellanox.com>
Signed-off-by: Jiri Pirko <jiri@mellanox.com>
Signed-off-by: David S. Miller <davem@davemloft.net>
2017-02-08 18:16:40 +08:00
|
|
|
union {
|
2019-06-18 23:12:52 +08:00
|
|
|
struct mlxsw_sp_fib6_event_work fib6_work;
|
mlxsw: spectrum_router: Reflect nexthop status changes
When a packet hits a multipath route in the device's routing table, a
hash is computed over its headers, which is then used to select the
appropriate nexthop from the device's adjacency table.
There are situations in which the kernel removes a nexthop from a
multipath route (e.g., no carrier) and the device should do the same.
Upon the reception of NH_{ADD,DEL} events, add or remove a nexthop from
the device's adjacency table and refresh all the routes using the
nexthop group. If all the nexthops of a multipath route are invalid,
then any packet hitting the route would be trapped to the CPU for
forwarding.
If all the nexthops are DEAD, then the kernel would remove the route
entirely. On the other hand, if all the nexthops are merely LINKDOWN,
then the kernel would keep the route and forward any incoming packet
using a different route.
While the last case might sound like a problem, it's expected that a
routing daemon running in user space would remove such a route from the
FIB as it's dumped with the DEAD flag set.
Signed-off-by: Ido Schimmel <idosch@mellanox.com>
Signed-off-by: Jiri Pirko <jiri@mellanox.com>
Signed-off-by: David S. Miller <davem@davemloft.net>
2017-02-08 18:16:40 +08:00
|
|
|
struct fib_entry_notifier_info fen_info;
|
2017-03-16 16:08:14 +08:00
|
|
|
struct fib_rule_notifier_info fr_info;
|
mlxsw: spectrum_router: Reflect nexthop status changes
When a packet hits a multipath route in the device's routing table, a
hash is computed over its headers, which is then used to select the
appropriate nexthop from the device's adjacency table.
There are situations in which the kernel removes a nexthop from a
multipath route (e.g., no carrier) and the device should do the same.
Upon the reception of NH_{ADD,DEL} events, add or remove a nexthop from
the device's adjacency table and refresh all the routes using the
nexthop group. If all the nexthops of a multipath route are invalid,
then any packet hitting the route would be trapped to the CPU for
forwarding.
If all the nexthops are DEAD, then the kernel would remove the route
entirely. On the other hand, if all the nexthops are merely LINKDOWN,
then the kernel would keep the route and forward any incoming packet
using a different route.
While the last case might sound like a problem, it's expected that a
routing daemon running in user space would remove such a route from the
FIB as it's dumped with the DEAD flag set.
Signed-off-by: Ido Schimmel <idosch@mellanox.com>
Signed-off-by: Jiri Pirko <jiri@mellanox.com>
Signed-off-by: David S. Miller <davem@davemloft.net>
2017-02-08 18:16:40 +08:00
|
|
|
struct fib_nh_notifier_info fnh_info;
|
2017-09-27 14:23:20 +08:00
|
|
|
struct mfc_entry_notifier_info men_info;
|
|
|
|
struct vif_entry_notifier_info ven_info;
|
mlxsw: spectrum_router: Reflect nexthop status changes
When a packet hits a multipath route in the device's routing table, a
hash is computed over its headers, which is then used to select the
appropriate nexthop from the device's adjacency table.
There are situations in which the kernel removes a nexthop from a
multipath route (e.g., no carrier) and the device should do the same.
Upon the reception of NH_{ADD,DEL} events, add or remove a nexthop from
the device's adjacency table and refresh all the routes using the
nexthop group. If all the nexthops of a multipath route are invalid,
then any packet hitting the route would be trapped to the CPU for
forwarding.
If all the nexthops are DEAD, then the kernel would remove the route
entirely. On the other hand, if all the nexthops are merely LINKDOWN,
then the kernel would keep the route and forward any incoming packet
using a different route.
While the last case might sound like a problem, it's expected that a
routing daemon running in user space would remove such a route from the
FIB as it's dumped with the DEAD flag set.
Signed-off-by: Ido Schimmel <idosch@mellanox.com>
Signed-off-by: Jiri Pirko <jiri@mellanox.com>
Signed-off-by: David S. Miller <davem@davemloft.net>
2017-02-08 18:16:40 +08:00
|
|
|
};
|
2016-12-03 23:45:01 +08:00
|
|
|
struct mlxsw_sp *mlxsw_sp;
|
|
|
|
unsigned long event;
|
|
|
|
};
|
|
|
|
|
2019-06-18 23:12:52 +08:00
|
|
|
static int
|
|
|
|
mlxsw_sp_router_fib6_work_init(struct mlxsw_sp_fib6_event_work *fib6_work,
|
|
|
|
struct fib6_entry_notifier_info *fen6_info)
|
|
|
|
{
|
|
|
|
struct fib6_info *rt = fen6_info->rt;
|
|
|
|
struct fib6_info **rt_arr;
|
|
|
|
struct fib6_info *iter;
|
|
|
|
unsigned int nrt6;
|
|
|
|
int i = 0;
|
|
|
|
|
|
|
|
nrt6 = fen6_info->nsiblings + 1;
|
|
|
|
|
|
|
|
rt_arr = kcalloc(nrt6, sizeof(struct fib6_info *), GFP_ATOMIC);
|
|
|
|
if (!rt_arr)
|
|
|
|
return -ENOMEM;
|
|
|
|
|
|
|
|
fib6_work->rt_arr = rt_arr;
|
|
|
|
fib6_work->nrt6 = nrt6;
|
|
|
|
|
|
|
|
rt_arr[0] = rt;
|
|
|
|
fib6_info_hold(rt);
|
|
|
|
|
|
|
|
if (!fen6_info->nsiblings)
|
|
|
|
return 0;
|
|
|
|
|
|
|
|
list_for_each_entry(iter, &rt->fib6_siblings, fib6_siblings) {
|
|
|
|
if (i == fen6_info->nsiblings)
|
|
|
|
break;
|
|
|
|
|
|
|
|
rt_arr[i + 1] = iter;
|
|
|
|
fib6_info_hold(iter);
|
|
|
|
i++;
|
|
|
|
}
|
|
|
|
WARN_ON_ONCE(i != fen6_info->nsiblings);
|
|
|
|
|
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
|
|
|
static void
|
|
|
|
mlxsw_sp_router_fib6_work_fini(struct mlxsw_sp_fib6_event_work *fib6_work)
|
|
|
|
{
|
|
|
|
int i;
|
|
|
|
|
|
|
|
for (i = 0; i < fib6_work->nrt6; i++)
|
|
|
|
mlxsw_sp_rt6_release(fib6_work->rt_arr[i]);
|
|
|
|
kfree(fib6_work->rt_arr);
|
|
|
|
}
|
|
|
|
|
2017-08-03 19:28:26 +08:00
|
|
|
static void mlxsw_sp_router_fib4_event_work(struct work_struct *work)
|
2016-09-26 18:52:31 +08:00
|
|
|
{
|
2016-12-03 23:45:01 +08:00
|
|
|
struct mlxsw_sp_fib_event_work *fib_work =
|
2017-02-06 23:20:10 +08:00
|
|
|
container_of(work, struct mlxsw_sp_fib_event_work, work);
|
2016-12-03 23:45:01 +08:00
|
|
|
struct mlxsw_sp *mlxsw_sp = fib_work->mlxsw_sp;
|
2016-09-26 18:52:31 +08:00
|
|
|
int err;
|
|
|
|
|
2016-12-03 23:45:01 +08:00
|
|
|
rtnl_lock();
|
2020-02-22 01:54:10 +08:00
|
|
|
mutex_lock(&mlxsw_sp->router->lock);
|
2018-02-27 21:53:46 +08:00
|
|
|
mlxsw_sp_span_respin(mlxsw_sp);
|
|
|
|
|
2016-12-03 23:45:01 +08:00
|
|
|
switch (fib_work->event) {
|
2019-12-14 23:53:15 +08:00
|
|
|
case FIB_EVENT_ENTRY_REPLACE:
|
2019-12-14 23:53:14 +08:00
|
|
|
err = mlxsw_sp_router_fib4_replace(mlxsw_sp,
|
|
|
|
&fib_work->fen_info);
|
2016-09-26 18:52:31 +08:00
|
|
|
if (err)
|
2017-07-18 16:10:25 +08:00
|
|
|
mlxsw_sp_router_fib_abort(mlxsw_sp);
|
2016-12-03 23:45:01 +08:00
|
|
|
fib_info_put(fib_work->fen_info.fi);
|
2016-09-26 18:52:31 +08:00
|
|
|
break;
|
2019-12-14 23:53:15 +08:00
|
|
|
case FIB_EVENT_ENTRY_DEL:
|
2016-12-03 23:45:01 +08:00
|
|
|
mlxsw_sp_router_fib4_del(mlxsw_sp, &fib_work->fen_info);
|
|
|
|
fib_info_put(fib_work->fen_info.fi);
|
2016-09-26 18:52:31 +08:00
|
|
|
break;
|
mlxsw: spectrum_router: Reflect nexthop status changes
When a packet hits a multipath route in the device's routing table, a
hash is computed over its headers, which is then used to select the
appropriate nexthop from the device's adjacency table.
There are situations in which the kernel removes a nexthop from a
multipath route (e.g., no carrier) and the device should do the same.
Upon the reception of NH_{ADD,DEL} events, add or remove a nexthop from
the device's adjacency table and refresh all the routes using the
nexthop group. If all the nexthops of a multipath route are invalid,
then any packet hitting the route would be trapped to the CPU for
forwarding.
If all the nexthops are DEAD, then the kernel would remove the route
entirely. On the other hand, if all the nexthops are merely LINKDOWN,
then the kernel would keep the route and forward any incoming packet
using a different route.
While the last case might sound like a problem, it's expected that a
routing daemon running in user space would remove such a route from the
FIB as it's dumped with the DEAD flag set.
Signed-off-by: Ido Schimmel <idosch@mellanox.com>
Signed-off-by: Jiri Pirko <jiri@mellanox.com>
Signed-off-by: David S. Miller <davem@davemloft.net>
2017-02-08 18:16:40 +08:00
|
|
|
case FIB_EVENT_NH_ADD: /* fall through */
|
|
|
|
case FIB_EVENT_NH_DEL:
|
2017-07-18 16:10:27 +08:00
|
|
|
mlxsw_sp_nexthop4_event(mlxsw_sp, fib_work->event,
|
|
|
|
fib_work->fnh_info.fib_nh);
|
mlxsw: spectrum_router: Reflect nexthop status changes
When a packet hits a multipath route in the device's routing table, a
hash is computed over its headers, which is then used to select the
appropriate nexthop from the device's adjacency table.
There are situations in which the kernel removes a nexthop from a
multipath route (e.g., no carrier) and the device should do the same.
Upon the reception of NH_{ADD,DEL} events, add or remove a nexthop from
the device's adjacency table and refresh all the routes using the
nexthop group. If all the nexthops of a multipath route are invalid,
then any packet hitting the route would be trapped to the CPU for
forwarding.
If all the nexthops are DEAD, then the kernel would remove the route
entirely. On the other hand, if all the nexthops are merely LINKDOWN,
then the kernel would keep the route and forward any incoming packet
using a different route.
While the last case might sound like a problem, it's expected that a
routing daemon running in user space would remove such a route from the
FIB as it's dumped with the DEAD flag set.
Signed-off-by: Ido Schimmel <idosch@mellanox.com>
Signed-off-by: Jiri Pirko <jiri@mellanox.com>
Signed-off-by: David S. Miller <davem@davemloft.net>
2017-02-08 18:16:40 +08:00
|
|
|
fib_info_put(fib_work->fnh_info.fib_nh->nh_parent);
|
|
|
|
break;
|
2016-09-26 18:52:31 +08:00
|
|
|
}
|
2020-02-22 01:54:10 +08:00
|
|
|
mutex_unlock(&mlxsw_sp->router->lock);
|
2016-12-03 23:45:01 +08:00
|
|
|
rtnl_unlock();
|
|
|
|
kfree(fib_work);
|
|
|
|
}
|
|
|
|
|
2017-08-03 19:28:26 +08:00
|
|
|
static void mlxsw_sp_router_fib6_event_work(struct work_struct *work)
|
|
|
|
{
|
2017-08-03 19:28:27 +08:00
|
|
|
struct mlxsw_sp_fib_event_work *fib_work =
|
|
|
|
container_of(work, struct mlxsw_sp_fib_event_work, work);
|
|
|
|
struct mlxsw_sp *mlxsw_sp = fib_work->mlxsw_sp;
|
2017-08-03 19:28:28 +08:00
|
|
|
int err;
|
2017-08-03 19:28:27 +08:00
|
|
|
|
|
|
|
rtnl_lock();
|
2020-02-22 01:54:10 +08:00
|
|
|
mutex_lock(&mlxsw_sp->router->lock);
|
2018-02-27 21:53:46 +08:00
|
|
|
mlxsw_sp_span_respin(mlxsw_sp);
|
|
|
|
|
2017-08-03 19:28:27 +08:00
|
|
|
switch (fib_work->event) {
|
2019-12-23 21:28:20 +08:00
|
|
|
case FIB_EVENT_ENTRY_REPLACE:
|
2019-12-23 21:28:19 +08:00
|
|
|
err = mlxsw_sp_router_fib6_replace(mlxsw_sp,
|
|
|
|
fib_work->fib6_work.rt_arr,
|
|
|
|
fib_work->fib6_work.nrt6);
|
2017-08-03 19:28:28 +08:00
|
|
|
if (err)
|
|
|
|
mlxsw_sp_router_fib_abort(mlxsw_sp);
|
2019-06-18 23:12:52 +08:00
|
|
|
mlxsw_sp_router_fib6_work_fini(&fib_work->fib6_work);
|
2017-08-03 19:28:28 +08:00
|
|
|
break;
|
2019-12-23 21:28:19 +08:00
|
|
|
case FIB_EVENT_ENTRY_APPEND:
|
|
|
|
err = mlxsw_sp_router_fib6_append(mlxsw_sp,
|
|
|
|
fib_work->fib6_work.rt_arr,
|
|
|
|
fib_work->fib6_work.nrt6);
|
|
|
|
if (err)
|
|
|
|
mlxsw_sp_router_fib_abort(mlxsw_sp);
|
|
|
|
mlxsw_sp_router_fib6_work_fini(&fib_work->fib6_work);
|
|
|
|
break;
|
2019-12-23 21:28:20 +08:00
|
|
|
case FIB_EVENT_ENTRY_DEL:
|
2019-06-18 23:12:52 +08:00
|
|
|
mlxsw_sp_router_fib6_del(mlxsw_sp,
|
2019-06-18 23:12:54 +08:00
|
|
|
fib_work->fib6_work.rt_arr,
|
|
|
|
fib_work->fib6_work.nrt6);
|
2019-06-18 23:12:52 +08:00
|
|
|
mlxsw_sp_router_fib6_work_fini(&fib_work->fib6_work);
|
2017-08-03 19:28:28 +08:00
|
|
|
break;
|
2017-08-03 19:28:27 +08:00
|
|
|
}
|
2020-02-22 01:54:10 +08:00
|
|
|
mutex_unlock(&mlxsw_sp->router->lock);
|
2017-08-03 19:28:27 +08:00
|
|
|
rtnl_unlock();
|
|
|
|
kfree(fib_work);
|
2017-08-03 19:28:26 +08:00
|
|
|
}
|
|
|
|
|
2017-09-27 14:23:20 +08:00
|
|
|
static void mlxsw_sp_router_fibmr_event_work(struct work_struct *work)
|
|
|
|
{
|
|
|
|
struct mlxsw_sp_fib_event_work *fib_work =
|
|
|
|
container_of(work, struct mlxsw_sp_fib_event_work, work);
|
|
|
|
struct mlxsw_sp *mlxsw_sp = fib_work->mlxsw_sp;
|
|
|
|
bool replace;
|
|
|
|
int err;
|
|
|
|
|
|
|
|
rtnl_lock();
|
2020-02-22 01:54:10 +08:00
|
|
|
mutex_lock(&mlxsw_sp->router->lock);
|
2017-09-27 14:23:20 +08:00
|
|
|
switch (fib_work->event) {
|
|
|
|
case FIB_EVENT_ENTRY_REPLACE: /* fall through */
|
|
|
|
case FIB_EVENT_ENTRY_ADD:
|
|
|
|
replace = fib_work->event == FIB_EVENT_ENTRY_REPLACE;
|
|
|
|
|
|
|
|
err = mlxsw_sp_router_fibmr_add(mlxsw_sp, &fib_work->men_info,
|
|
|
|
replace);
|
|
|
|
if (err)
|
|
|
|
mlxsw_sp_router_fib_abort(mlxsw_sp);
|
2018-03-26 20:01:36 +08:00
|
|
|
mr_cache_put(fib_work->men_info.mfc);
|
2017-09-27 14:23:20 +08:00
|
|
|
break;
|
|
|
|
case FIB_EVENT_ENTRY_DEL:
|
|
|
|
mlxsw_sp_router_fibmr_del(mlxsw_sp, &fib_work->men_info);
|
2018-03-26 20:01:36 +08:00
|
|
|
mr_cache_put(fib_work->men_info.mfc);
|
2017-09-27 14:23:20 +08:00
|
|
|
break;
|
|
|
|
case FIB_EVENT_VIF_ADD:
|
|
|
|
err = mlxsw_sp_router_fibmr_vif_add(mlxsw_sp,
|
|
|
|
&fib_work->ven_info);
|
|
|
|
if (err)
|
|
|
|
mlxsw_sp_router_fib_abort(mlxsw_sp);
|
|
|
|
dev_put(fib_work->ven_info.dev);
|
|
|
|
break;
|
|
|
|
case FIB_EVENT_VIF_DEL:
|
|
|
|
mlxsw_sp_router_fibmr_vif_del(mlxsw_sp,
|
|
|
|
&fib_work->ven_info);
|
|
|
|
dev_put(fib_work->ven_info.dev);
|
|
|
|
break;
|
|
|
|
}
|
2020-02-22 01:54:10 +08:00
|
|
|
mutex_unlock(&mlxsw_sp->router->lock);
|
2017-09-27 14:23:20 +08:00
|
|
|
rtnl_unlock();
|
|
|
|
kfree(fib_work);
|
|
|
|
}
|
|
|
|
|
2017-08-03 19:28:26 +08:00
|
|
|
static void mlxsw_sp_router_fib4_event(struct mlxsw_sp_fib_event_work *fib_work,
|
|
|
|
struct fib_notifier_info *info)
|
|
|
|
{
|
2017-10-19 06:01:38 +08:00
|
|
|
struct fib_entry_notifier_info *fen_info;
|
|
|
|
struct fib_nh_notifier_info *fnh_info;
|
|
|
|
|
2017-08-03 19:28:26 +08:00
|
|
|
switch (fib_work->event) {
|
2019-12-14 23:53:15 +08:00
|
|
|
case FIB_EVENT_ENTRY_REPLACE: /* fall through */
|
|
|
|
case FIB_EVENT_ENTRY_DEL:
|
2017-10-19 06:01:38 +08:00
|
|
|
fen_info = container_of(info, struct fib_entry_notifier_info,
|
|
|
|
info);
|
|
|
|
fib_work->fen_info = *fen_info;
|
|
|
|
/* Take reference on fib_info to prevent it from being
|
2017-08-03 19:28:26 +08:00
|
|
|
* freed while work is queued. Release it afterwards.
|
|
|
|
*/
|
|
|
|
fib_info_hold(fib_work->fen_info.fi);
|
|
|
|
break;
|
|
|
|
case FIB_EVENT_NH_ADD: /* fall through */
|
|
|
|
case FIB_EVENT_NH_DEL:
|
2017-10-19 06:01:38 +08:00
|
|
|
fnh_info = container_of(info, struct fib_nh_notifier_info,
|
|
|
|
info);
|
|
|
|
fib_work->fnh_info = *fnh_info;
|
2017-08-03 19:28:26 +08:00
|
|
|
fib_info_hold(fib_work->fnh_info.fib_nh->nh_parent);
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2019-06-18 23:12:51 +08:00
|
|
|
static int mlxsw_sp_router_fib6_event(struct mlxsw_sp_fib_event_work *fib_work,
|
|
|
|
struct fib_notifier_info *info)
|
2017-08-03 19:28:26 +08:00
|
|
|
{
|
2017-10-19 06:01:38 +08:00
|
|
|
struct fib6_entry_notifier_info *fen6_info;
|
2019-06-18 23:12:52 +08:00
|
|
|
int err;
|
2017-10-19 06:01:38 +08:00
|
|
|
|
2017-08-03 19:28:27 +08:00
|
|
|
switch (fib_work->event) {
|
2019-12-23 21:28:20 +08:00
|
|
|
case FIB_EVENT_ENTRY_REPLACE: /* fall through */
|
2019-12-23 21:28:19 +08:00
|
|
|
case FIB_EVENT_ENTRY_APPEND: /* fall through */
|
2019-12-23 21:28:20 +08:00
|
|
|
case FIB_EVENT_ENTRY_DEL:
|
2017-10-19 06:01:38 +08:00
|
|
|
fen6_info = container_of(info, struct fib6_entry_notifier_info,
|
|
|
|
info);
|
2019-06-18 23:12:52 +08:00
|
|
|
err = mlxsw_sp_router_fib6_work_init(&fib_work->fib6_work,
|
|
|
|
fen6_info);
|
|
|
|
if (err)
|
|
|
|
return err;
|
2017-08-03 19:28:28 +08:00
|
|
|
break;
|
2017-08-03 19:28:27 +08:00
|
|
|
}
|
2019-06-18 23:12:51 +08:00
|
|
|
|
|
|
|
return 0;
|
2017-08-03 19:28:26 +08:00
|
|
|
}
|
|
|
|
|
2017-09-27 14:23:20 +08:00
|
|
|
static void
|
|
|
|
mlxsw_sp_router_fibmr_event(struct mlxsw_sp_fib_event_work *fib_work,
|
|
|
|
struct fib_notifier_info *info)
|
|
|
|
{
|
|
|
|
switch (fib_work->event) {
|
|
|
|
case FIB_EVENT_ENTRY_REPLACE: /* fall through */
|
|
|
|
case FIB_EVENT_ENTRY_ADD: /* fall through */
|
|
|
|
case FIB_EVENT_ENTRY_DEL:
|
|
|
|
memcpy(&fib_work->men_info, info, sizeof(fib_work->men_info));
|
2018-03-26 20:01:36 +08:00
|
|
|
mr_cache_hold(fib_work->men_info.mfc);
|
2017-09-27 14:23:20 +08:00
|
|
|
break;
|
|
|
|
case FIB_EVENT_VIF_ADD: /* fall through */
|
|
|
|
case FIB_EVENT_VIF_DEL:
|
|
|
|
memcpy(&fib_work->ven_info, info, sizeof(fib_work->ven_info));
|
|
|
|
dev_hold(fib_work->ven_info.dev);
|
|
|
|
break;
|
2017-10-28 08:37:14 +08:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
static int mlxsw_sp_router_fib_rule_event(unsigned long event,
|
|
|
|
struct fib_notifier_info *info,
|
|
|
|
struct mlxsw_sp *mlxsw_sp)
|
|
|
|
{
|
|
|
|
struct netlink_ext_ack *extack = info->extack;
|
|
|
|
struct fib_rule_notifier_info *fr_info;
|
|
|
|
struct fib_rule *rule;
|
|
|
|
int err = 0;
|
|
|
|
|
|
|
|
/* nothing to do at the moment */
|
|
|
|
if (event == FIB_EVENT_RULE_DEL)
|
|
|
|
return 0;
|
|
|
|
|
|
|
|
if (mlxsw_sp->router->aborted)
|
|
|
|
return 0;
|
|
|
|
|
|
|
|
fr_info = container_of(info, struct fib_rule_notifier_info, info);
|
|
|
|
rule = fr_info->rule;
|
|
|
|
|
2019-04-21 15:18:36 +08:00
|
|
|
/* Rule only affects locally generated traffic */
|
2019-10-03 17:49:32 +08:00
|
|
|
if (rule->iifindex == mlxsw_sp_net(mlxsw_sp)->loopback_dev->ifindex)
|
2019-04-21 15:18:36 +08:00
|
|
|
return 0;
|
|
|
|
|
2017-10-28 08:37:14 +08:00
|
|
|
switch (info->family) {
|
|
|
|
case AF_INET:
|
|
|
|
if (!fib4_rule_default(rule) && !rule->l3mdev)
|
2018-05-02 15:17:34 +08:00
|
|
|
err = -EOPNOTSUPP;
|
2017-10-28 08:37:14 +08:00
|
|
|
break;
|
|
|
|
case AF_INET6:
|
|
|
|
if (!fib6_rule_default(rule) && !rule->l3mdev)
|
2018-05-02 15:17:34 +08:00
|
|
|
err = -EOPNOTSUPP;
|
2017-10-28 08:37:14 +08:00
|
|
|
break;
|
|
|
|
case RTNL_FAMILY_IPMR:
|
|
|
|
if (!ipmr_rule_default(rule) && !rule->l3mdev)
|
2018-05-02 15:17:34 +08:00
|
|
|
err = -EOPNOTSUPP;
|
2017-09-27 14:23:20 +08:00
|
|
|
break;
|
2018-03-26 20:01:44 +08:00
|
|
|
case RTNL_FAMILY_IP6MR:
|
|
|
|
if (!ip6mr_rule_default(rule) && !rule->l3mdev)
|
2018-05-02 15:17:34 +08:00
|
|
|
err = -EOPNOTSUPP;
|
2018-03-26 20:01:44 +08:00
|
|
|
break;
|
2017-09-27 14:23:20 +08:00
|
|
|
}
|
2017-10-28 08:37:14 +08:00
|
|
|
|
|
|
|
if (err < 0)
|
2018-05-02 15:17:34 +08:00
|
|
|
NL_SET_ERR_MSG_MOD(extack, "FIB rules not supported");
|
2017-10-28 08:37:14 +08:00
|
|
|
|
|
|
|
return err;
|
2017-09-27 14:23:20 +08:00
|
|
|
}
|
|
|
|
|
2016-12-03 23:45:01 +08:00
|
|
|
/* Called with rcu_read_lock() */
|
|
|
|
static int mlxsw_sp_router_fib_event(struct notifier_block *nb,
|
|
|
|
unsigned long event, void *ptr)
|
|
|
|
{
|
|
|
|
struct mlxsw_sp_fib_event_work *fib_work;
|
|
|
|
struct fib_notifier_info *info = ptr;
|
2017-05-17 01:38:28 +08:00
|
|
|
struct mlxsw_sp_router *router;
|
2017-10-28 08:37:14 +08:00
|
|
|
int err;
|
2016-12-03 23:45:01 +08:00
|
|
|
|
2019-10-03 17:49:27 +08:00
|
|
|
if ((info->family != AF_INET && info->family != AF_INET6 &&
|
2018-03-26 20:01:44 +08:00
|
|
|
info->family != RTNL_FAMILY_IPMR &&
|
|
|
|
info->family != RTNL_FAMILY_IP6MR))
|
2016-12-03 23:45:01 +08:00
|
|
|
return NOTIFY_DONE;
|
|
|
|
|
2017-10-28 08:37:14 +08:00
|
|
|
router = container_of(nb, struct mlxsw_sp_router, fib_nb);
|
|
|
|
|
|
|
|
switch (event) {
|
|
|
|
case FIB_EVENT_RULE_ADD: /* fall through */
|
|
|
|
case FIB_EVENT_RULE_DEL:
|
|
|
|
err = mlxsw_sp_router_fib_rule_event(event, info,
|
|
|
|
router->mlxsw_sp);
|
2019-10-03 17:49:29 +08:00
|
|
|
return notifier_from_errno(err);
|
2019-12-14 23:53:14 +08:00
|
|
|
case FIB_EVENT_ENTRY_ADD: /* fall through */
|
2019-12-23 21:28:19 +08:00
|
|
|
case FIB_EVENT_ENTRY_REPLACE: /* fall through */
|
|
|
|
case FIB_EVENT_ENTRY_APPEND:
|
2018-05-02 15:17:35 +08:00
|
|
|
if (router->aborted) {
|
|
|
|
NL_SET_ERR_MSG_MOD(info->extack, "FIB offload was aborted. Not configuring route");
|
|
|
|
return notifier_from_errno(-EINVAL);
|
|
|
|
}
|
2019-04-06 07:30:39 +08:00
|
|
|
if (info->family == AF_INET) {
|
|
|
|
struct fib_entry_notifier_info *fen_info = ptr;
|
|
|
|
|
|
|
|
if (fen_info->fi->fib_nh_is_v6) {
|
|
|
|
NL_SET_ERR_MSG_MOD(info->extack, "IPv6 gateway with IPv4 route is not supported");
|
|
|
|
return notifier_from_errno(-EINVAL);
|
|
|
|
}
|
2019-06-04 11:19:53 +08:00
|
|
|
if (fen_info->fi->nh) {
|
|
|
|
NL_SET_ERR_MSG_MOD(info->extack, "IPv4 route with nexthop objects is not supported");
|
|
|
|
return notifier_from_errno(-EINVAL);
|
|
|
|
}
|
|
|
|
} else if (info->family == AF_INET6) {
|
|
|
|
struct fib6_entry_notifier_info *fen6_info;
|
|
|
|
|
|
|
|
fen6_info = container_of(info,
|
|
|
|
struct fib6_entry_notifier_info,
|
|
|
|
info);
|
|
|
|
if (fen6_info->rt->nh) {
|
|
|
|
NL_SET_ERR_MSG_MOD(info->extack, "IPv6 route with nexthop objects is not supported");
|
|
|
|
return notifier_from_errno(-EINVAL);
|
|
|
|
}
|
2019-04-06 07:30:39 +08:00
|
|
|
}
|
2018-05-02 15:17:35 +08:00
|
|
|
break;
|
2017-10-28 08:37:14 +08:00
|
|
|
}
|
|
|
|
|
2016-12-03 23:45:01 +08:00
|
|
|
fib_work = kzalloc(sizeof(*fib_work), GFP_ATOMIC);
|
|
|
|
if (WARN_ON(!fib_work))
|
|
|
|
return NOTIFY_BAD;
|
|
|
|
|
2017-05-17 01:38:28 +08:00
|
|
|
fib_work->mlxsw_sp = router->mlxsw_sp;
|
2016-12-03 23:45:01 +08:00
|
|
|
fib_work->event = event;
|
|
|
|
|
2017-08-03 19:28:26 +08:00
|
|
|
switch (info->family) {
|
|
|
|
case AF_INET:
|
|
|
|
INIT_WORK(&fib_work->work, mlxsw_sp_router_fib4_event_work);
|
|
|
|
mlxsw_sp_router_fib4_event(fib_work, info);
|
2016-12-03 23:45:01 +08:00
|
|
|
break;
|
2017-08-03 19:28:26 +08:00
|
|
|
case AF_INET6:
|
|
|
|
INIT_WORK(&fib_work->work, mlxsw_sp_router_fib6_event_work);
|
2019-06-18 23:12:51 +08:00
|
|
|
err = mlxsw_sp_router_fib6_event(fib_work, info);
|
|
|
|
if (err)
|
|
|
|
goto err_fib_event;
|
mlxsw: spectrum_router: Reflect nexthop status changes
When a packet hits a multipath route in the device's routing table, a
hash is computed over its headers, which is then used to select the
appropriate nexthop from the device's adjacency table.
There are situations in which the kernel removes a nexthop from a
multipath route (e.g., no carrier) and the device should do the same.
Upon the reception of NH_{ADD,DEL} events, add or remove a nexthop from
the device's adjacency table and refresh all the routes using the
nexthop group. If all the nexthops of a multipath route are invalid,
then any packet hitting the route would be trapped to the CPU for
forwarding.
If all the nexthops are DEAD, then the kernel would remove the route
entirely. On the other hand, if all the nexthops are merely LINKDOWN,
then the kernel would keep the route and forward any incoming packet
using a different route.
While the last case might sound like a problem, it's expected that a
routing daemon running in user space would remove such a route from the
FIB as it's dumped with the DEAD flag set.
Signed-off-by: Ido Schimmel <idosch@mellanox.com>
Signed-off-by: Jiri Pirko <jiri@mellanox.com>
Signed-off-by: David S. Miller <davem@davemloft.net>
2017-02-08 18:16:40 +08:00
|
|
|
break;
|
2018-03-26 20:01:44 +08:00
|
|
|
case RTNL_FAMILY_IP6MR:
|
2017-09-27 14:23:20 +08:00
|
|
|
case RTNL_FAMILY_IPMR:
|
|
|
|
INIT_WORK(&fib_work->work, mlxsw_sp_router_fibmr_event_work);
|
|
|
|
mlxsw_sp_router_fibmr_event(fib_work, info);
|
|
|
|
break;
|
2016-12-03 23:45:01 +08:00
|
|
|
}
|
|
|
|
|
2017-02-06 23:20:10 +08:00
|
|
|
mlxsw_core_schedule_work(&fib_work->work);
|
2016-12-03 23:45:01 +08:00
|
|
|
|
2016-09-26 18:52:31 +08:00
|
|
|
return NOTIFY_DONE;
|
2019-06-18 23:12:51 +08:00
|
|
|
|
|
|
|
err_fib_event:
|
|
|
|
kfree(fib_work);
|
|
|
|
return NOTIFY_BAD;
|
2016-09-26 18:52:31 +08:00
|
|
|
}
|
|
|
|
|
2020-02-20 15:07:59 +08:00
|
|
|
static struct mlxsw_sp_rif *
|
2017-03-10 15:53:39 +08:00
|
|
|
mlxsw_sp_rif_find_by_dev(const struct mlxsw_sp *mlxsw_sp,
|
|
|
|
const struct net_device *dev)
|
|
|
|
{
|
|
|
|
int i;
|
|
|
|
|
|
|
|
for (i = 0; i < MLXSW_CORE_RES_GET(mlxsw_sp->core, MAX_RIFS); i++)
|
2017-05-17 01:38:27 +08:00
|
|
|
if (mlxsw_sp->router->rifs[i] &&
|
|
|
|
mlxsw_sp->router->rifs[i]->dev == dev)
|
|
|
|
return mlxsw_sp->router->rifs[i];
|
2017-03-10 15:53:39 +08:00
|
|
|
|
|
|
|
return NULL;
|
|
|
|
}
|
|
|
|
|
2020-02-20 15:07:59 +08:00
|
|
|
bool mlxsw_sp_rif_exists(struct mlxsw_sp *mlxsw_sp,
|
|
|
|
const struct net_device *dev)
|
|
|
|
{
|
|
|
|
return !!mlxsw_sp_rif_find_by_dev(mlxsw_sp, dev);
|
|
|
|
}
|
|
|
|
|
2020-02-20 15:07:58 +08:00
|
|
|
u16 mlxsw_sp_rif_vid(struct mlxsw_sp *mlxsw_sp, const struct net_device *dev)
|
|
|
|
{
|
|
|
|
struct mlxsw_sp_rif *rif;
|
|
|
|
u16 vid = 0;
|
|
|
|
|
|
|
|
rif = mlxsw_sp_rif_find_by_dev(mlxsw_sp, dev);
|
|
|
|
if (!rif)
|
|
|
|
goto out;
|
|
|
|
|
|
|
|
/* We only return the VID for VLAN RIFs. Otherwise we return an
|
|
|
|
* invalid value (0).
|
|
|
|
*/
|
|
|
|
if (rif->ops->type != MLXSW_SP_RIF_TYPE_VLAN)
|
|
|
|
goto out;
|
|
|
|
|
|
|
|
vid = mlxsw_sp_fid_8021q_vid(rif->fid);
|
|
|
|
|
|
|
|
out:
|
|
|
|
return vid;
|
|
|
|
}
|
|
|
|
|
2017-03-10 15:53:39 +08:00
|
|
|
/* Disable the RIF with index @rif.
 *
 * Performs a read-modify-write of the RITR register: the current
 * payload is queried, the enable flag is cleared and the payload is
 * written back. Returns 0 on success or the register access error.
 */
static int mlxsw_sp_router_rif_disable(struct mlxsw_sp *mlxsw_sp, u16 rif)
{
	char ritr_pl[MLXSW_REG_RITR_LEN];
	int rc;

	mlxsw_reg_ritr_rif_pack(ritr_pl, rif);
	rc = mlxsw_reg_query(mlxsw_sp->core, MLXSW_REG(ritr), ritr_pl);
	if (rc)
		return rc;

	mlxsw_reg_ritr_enable_set(ritr_pl, false);
	rc = mlxsw_reg_write(mlxsw_sp->core, MLXSW_REG(ritr), ritr_pl);
	return rc;
}
|
|
|
|
|
|
|
|
static void mlxsw_sp_router_rif_gone_sync(struct mlxsw_sp *mlxsw_sp,
|
2017-03-17 16:38:00 +08:00
|
|
|
struct mlxsw_sp_rif *rif)
|
2017-03-10 15:53:39 +08:00
|
|
|
{
|
2017-03-17 16:38:00 +08:00
|
|
|
mlxsw_sp_router_rif_disable(mlxsw_sp, rif->rif_index);
|
|
|
|
mlxsw_sp_nexthop_rif_gone_sync(mlxsw_sp, rif);
|
|
|
|
mlxsw_sp_neigh_rif_gone_sync(mlxsw_sp, rif);
|
2017-03-10 15:53:39 +08:00
|
|
|
}
|
|
|
|
|
2017-07-18 16:10:13 +08:00
|
|
|
static bool
|
|
|
|
mlxsw_sp_rif_should_config(struct mlxsw_sp_rif *rif, struct net_device *dev,
|
|
|
|
unsigned long event)
|
2017-03-10 15:53:39 +08:00
|
|
|
{
|
2017-07-18 16:10:13 +08:00
|
|
|
struct inet6_dev *inet6_dev;
|
|
|
|
bool addr_list_empty = true;
|
|
|
|
struct in_device *idev;
|
|
|
|
|
2017-03-10 15:53:39 +08:00
|
|
|
switch (event) {
|
|
|
|
case NETDEV_UP:
|
2017-07-31 15:27:28 +08:00
|
|
|
return rif == NULL;
|
2017-03-10 15:53:39 +08:00
|
|
|
case NETDEV_DOWN:
|
2020-02-20 15:07:54 +08:00
|
|
|
rcu_read_lock();
|
|
|
|
idev = __in_dev_get_rcu(dev);
|
2017-07-18 16:10:13 +08:00
|
|
|
if (idev && idev->ifa_list)
|
|
|
|
addr_list_empty = false;
|
|
|
|
|
|
|
|
inet6_dev = __in6_dev_get(dev);
|
|
|
|
if (addr_list_empty && inet6_dev &&
|
|
|
|
!list_empty(&inet6_dev->addr_list))
|
|
|
|
addr_list_empty = false;
|
2020-02-20 15:07:54 +08:00
|
|
|
rcu_read_unlock();
|
2017-07-18 16:10:13 +08:00
|
|
|
|
2018-07-14 16:39:52 +08:00
|
|
|
/* macvlans do not have a RIF, but rather piggy back on the
|
|
|
|
* RIF of their lower device.
|
|
|
|
*/
|
|
|
|
if (netif_is_macvlan(dev) && addr_list_empty)
|
|
|
|
return true;
|
|
|
|
|
2017-07-18 16:10:13 +08:00
|
|
|
if (rif && addr_list_empty &&
|
2017-03-17 16:38:00 +08:00
|
|
|
!netif_is_l3_slave(rif->dev))
|
2017-03-10 15:53:39 +08:00
|
|
|
return true;
|
|
|
|
/* It is possible we already removed the RIF ourselves
|
|
|
|
* if it was assigned to a netdev that is now a bridge
|
|
|
|
* or LAG slave.
|
|
|
|
*/
|
|
|
|
return false;
|
|
|
|
}
|
|
|
|
|
|
|
|
return false;
|
|
|
|
}
|
|
|
|
|
2017-05-26 14:37:40 +08:00
|
|
|
static enum mlxsw_sp_rif_type
|
|
|
|
mlxsw_sp_dev_rif_type(const struct mlxsw_sp *mlxsw_sp,
|
|
|
|
const struct net_device *dev)
|
|
|
|
{
|
|
|
|
enum mlxsw_sp_fid_type type;
|
|
|
|
|
2017-09-03 05:49:19 +08:00
|
|
|
if (mlxsw_sp_netdev_ipip_type(mlxsw_sp, dev, NULL))
|
|
|
|
return MLXSW_SP_RIF_TYPE_IPIP_LB;
|
|
|
|
|
|
|
|
/* Otherwise RIF type is derived from the type of the underlying FID. */
|
2017-05-26 14:37:40 +08:00
|
|
|
if (is_vlan_dev(dev) && netif_is_bridge_master(vlan_dev_real_dev(dev)))
|
|
|
|
type = MLXSW_SP_FID_TYPE_8021Q;
|
|
|
|
else if (netif_is_bridge_master(dev) && br_vlan_enabled(dev))
|
|
|
|
type = MLXSW_SP_FID_TYPE_8021Q;
|
|
|
|
else if (netif_is_bridge_master(dev))
|
|
|
|
type = MLXSW_SP_FID_TYPE_8021D;
|
|
|
|
else
|
|
|
|
type = MLXSW_SP_FID_TYPE_RFID;
|
|
|
|
|
|
|
|
return mlxsw_sp_fid_type_rif_type(mlxsw_sp, type);
|
|
|
|
}
|
|
|
|
|
2017-06-04 22:53:40 +08:00
|
|
|
/* Find the lowest unused slot in the RIF table.
 *
 * On success stores the slot number in @p_rif_index and returns 0.
 * Returns -ENOBUFS when every slot is occupied. The slot is not
 * reserved here; the caller populates it.
 */
static int mlxsw_sp_rif_index_alloc(struct mlxsw_sp *mlxsw_sp, u16 *p_rif_index)
{
	int idx;

	for (idx = 0; idx < MLXSW_CORE_RES_GET(mlxsw_sp->core, MAX_RIFS);
	     idx++) {
		if (mlxsw_sp->router->rifs[idx])
			continue;

		*p_rif_index = idx;
		return 0;
	}

	return -ENOBUFS;
}
|
|
|
|
|
2017-05-26 14:37:40 +08:00
|
|
|
/* Allocate and minimally initialise a RIF object of @rif_size bytes.
 *
 * The object is zeroed, its nexthop and neighbour lists are initialised
 * and the index / virtual router ID are recorded. When @l3_dev is
 * given, its MAC address, MTU and pointer are copied in; no reference
 * on the device is taken here.
 *
 * Returns the new RIF or NULL on allocation failure.
 */
static struct mlxsw_sp_rif *mlxsw_sp_rif_alloc(size_t rif_size, u16 rif_index,
					       u16 vr_id,
					       struct net_device *l3_dev)
{
	struct mlxsw_sp_rif *rif = kzalloc(rif_size, GFP_KERNEL);

	if (!rif)
		return NULL;

	rif->rif_index = rif_index;
	rif->vr_id = vr_id;
	INIT_LIST_HEAD(&rif->nexthop_list);
	INIT_LIST_HEAD(&rif->neigh_list);

	if (l3_dev) {
		rif->dev = l3_dev;
		rif->mtu = l3_dev->mtu;
		ether_addr_copy(rif->addr, l3_dev->dev_addr);
	}

	return rif;
}
|
|
|
|
|
2017-05-17 01:38:27 +08:00
|
|
|
struct mlxsw_sp_rif *mlxsw_sp_rif_by_index(const struct mlxsw_sp *mlxsw_sp,
|
|
|
|
u16 rif_index)
|
|
|
|
{
|
|
|
|
return mlxsw_sp->router->rifs[rif_index];
|
|
|
|
}
|
|
|
|
|
2017-03-28 23:24:16 +08:00
|
|
|
u16 mlxsw_sp_rif_index(const struct mlxsw_sp_rif *rif)
|
|
|
|
{
|
|
|
|
return rif->rif_index;
|
|
|
|
}
|
|
|
|
|
2017-09-03 05:49:28 +08:00
|
|
|
u16 mlxsw_sp_ipip_lb_rif_index(const struct mlxsw_sp_rif_ipip_lb *lb_rif)
|
|
|
|
{
|
|
|
|
return lb_rif->common.rif_index;
|
|
|
|
}
|
|
|
|
|
|
|
|
u16 mlxsw_sp_ipip_lb_ul_vr_id(const struct mlxsw_sp_rif_ipip_lb *lb_rif)
|
|
|
|
{
|
2019-01-20 14:50:48 +08:00
|
|
|
u32 ul_tb_id = mlxsw_sp_ipip_dev_ul_tb_id(lb_rif->common.dev);
|
|
|
|
struct mlxsw_sp_vr *ul_vr;
|
|
|
|
|
|
|
|
ul_vr = mlxsw_sp_vr_get(lb_rif->common.mlxsw_sp, ul_tb_id, NULL);
|
|
|
|
if (WARN_ON(IS_ERR(ul_vr)))
|
|
|
|
return 0;
|
|
|
|
|
|
|
|
return ul_vr->id;
|
2017-09-03 05:49:28 +08:00
|
|
|
}
|
|
|
|
|
2019-01-20 14:50:50 +08:00
|
|
|
u16 mlxsw_sp_ipip_lb_ul_rif_id(const struct mlxsw_sp_rif_ipip_lb *lb_rif)
|
|
|
|
{
|
|
|
|
return lb_rif->ul_rif_id;
|
|
|
|
}
|
|
|
|
|
2017-03-28 23:24:16 +08:00
|
|
|
int mlxsw_sp_rif_dev_ifindex(const struct mlxsw_sp_rif *rif)
|
|
|
|
{
|
|
|
|
return rif->dev->ifindex;
|
|
|
|
}
|
|
|
|
|
2017-09-19 16:00:19 +08:00
|
|
|
const struct net_device *mlxsw_sp_rif_dev(const struct mlxsw_sp_rif *rif)
|
|
|
|
{
|
|
|
|
return rif->dev;
|
|
|
|
}
|
|
|
|
|
2017-03-10 15:53:39 +08:00
|
|
|
static struct mlxsw_sp_rif *
|
2017-05-26 14:37:40 +08:00
|
|
|
mlxsw_sp_rif_create(struct mlxsw_sp *mlxsw_sp,
|
2017-10-19 00:56:56 +08:00
|
|
|
const struct mlxsw_sp_rif_params *params,
|
|
|
|
struct netlink_ext_ack *extack)
|
2017-03-10 15:53:39 +08:00
|
|
|
{
|
2017-05-26 14:37:40 +08:00
|
|
|
u32 tb_id = l3mdev_fib_table(params->dev);
|
|
|
|
const struct mlxsw_sp_rif_ops *ops;
|
2017-09-03 05:49:18 +08:00
|
|
|
struct mlxsw_sp_fid *fid = NULL;
|
2017-05-26 14:37:40 +08:00
|
|
|
enum mlxsw_sp_rif_type type;
|
2017-03-17 16:38:00 +08:00
|
|
|
struct mlxsw_sp_rif *rif;
|
2017-05-26 14:37:39 +08:00
|
|
|
struct mlxsw_sp_vr *vr;
|
|
|
|
u16 rif_index;
|
2018-03-26 20:01:40 +08:00
|
|
|
int i, err;
|
2017-03-10 15:53:39 +08:00
|
|
|
|
2017-05-26 14:37:40 +08:00
|
|
|
type = mlxsw_sp_dev_rif_type(mlxsw_sp, params->dev);
|
2019-01-20 14:50:41 +08:00
|
|
|
ops = mlxsw_sp->rif_ops_arr[type];
|
2017-05-26 14:37:40 +08:00
|
|
|
|
2017-10-19 00:56:56 +08:00
|
|
|
vr = mlxsw_sp_vr_get(mlxsw_sp, tb_id ? : RT_TABLE_MAIN, extack);
|
2017-05-26 14:37:38 +08:00
|
|
|
if (IS_ERR(vr))
|
|
|
|
return ERR_CAST(vr);
|
2017-10-02 18:14:56 +08:00
|
|
|
vr->rif_count++;
|
2017-05-26 14:37:38 +08:00
|
|
|
|
2017-06-04 22:53:40 +08:00
|
|
|
err = mlxsw_sp_rif_index_alloc(mlxsw_sp, &rif_index);
|
2017-10-19 00:56:56 +08:00
|
|
|
if (err) {
|
2018-02-13 18:29:05 +08:00
|
|
|
NL_SET_ERR_MSG_MOD(extack, "Exceeded number of supported router interfaces");
|
2017-06-04 22:53:40 +08:00
|
|
|
goto err_rif_index_alloc;
|
2017-10-19 00:56:56 +08:00
|
|
|
}
|
2017-03-10 15:53:39 +08:00
|
|
|
|
2017-05-26 14:37:40 +08:00
|
|
|
rif = mlxsw_sp_rif_alloc(ops->rif_size, rif_index, vr->id, params->dev);
|
2017-05-26 14:37:33 +08:00
|
|
|
if (!rif) {
|
|
|
|
err = -ENOMEM;
|
|
|
|
goto err_rif_alloc;
|
|
|
|
}
|
2018-12-19 14:08:50 +08:00
|
|
|
dev_hold(rif->dev);
|
2019-01-20 14:50:46 +08:00
|
|
|
mlxsw_sp->router->rifs[rif_index] = rif;
|
2017-05-26 14:37:40 +08:00
|
|
|
rif->mlxsw_sp = mlxsw_sp;
|
|
|
|
rif->ops = ops;
|
2017-05-26 14:37:33 +08:00
|
|
|
|
2017-09-03 05:49:18 +08:00
|
|
|
if (ops->fid_get) {
|
2018-06-25 15:48:13 +08:00
|
|
|
fid = ops->fid_get(rif, extack);
|
2017-09-03 05:49:18 +08:00
|
|
|
if (IS_ERR(fid)) {
|
|
|
|
err = PTR_ERR(fid);
|
|
|
|
goto err_fid_get;
|
|
|
|
}
|
|
|
|
rif->fid = fid;
|
2017-05-26 14:37:34 +08:00
|
|
|
}
|
|
|
|
|
2017-05-26 14:37:40 +08:00
|
|
|
if (ops->setup)
|
|
|
|
ops->setup(rif, params);
|
|
|
|
|
|
|
|
err = ops->configure(rif);
|
2017-03-10 15:53:39 +08:00
|
|
|
if (err)
|
2017-05-26 14:37:40 +08:00
|
|
|
goto err_configure;
|
2017-03-10 15:53:39 +08:00
|
|
|
|
2018-03-26 20:01:40 +08:00
|
|
|
for (i = 0; i < MLXSW_SP_L3_PROTO_MAX; i++) {
|
|
|
|
err = mlxsw_sp_mr_rif_add(vr->mr_table[i], rif);
|
|
|
|
if (err)
|
|
|
|
goto err_mr_rif_add;
|
|
|
|
}
|
2017-09-27 14:23:20 +08:00
|
|
|
|
2017-05-26 14:37:40 +08:00
|
|
|
mlxsw_sp_rif_counters_alloc(rif);
|
2017-03-10 15:53:39 +08:00
|
|
|
|
2017-03-17 16:38:00 +08:00
|
|
|
return rif;
|
2017-03-10 15:53:39 +08:00
|
|
|
|
2017-09-27 14:23:20 +08:00
|
|
|
err_mr_rif_add:
|
2018-03-26 20:01:40 +08:00
|
|
|
for (i--; i >= 0; i--)
|
|
|
|
mlxsw_sp_mr_rif_del(vr->mr_table[i], rif);
|
2017-09-27 14:23:20 +08:00
|
|
|
ops->deconfigure(rif);
|
2017-05-26 14:37:40 +08:00
|
|
|
err_configure:
|
2017-09-03 05:49:18 +08:00
|
|
|
if (fid)
|
|
|
|
mlxsw_sp_fid_put(fid);
|
2017-05-26 14:37:39 +08:00
|
|
|
err_fid_get:
|
2019-01-20 14:50:46 +08:00
|
|
|
mlxsw_sp->router->rifs[rif_index] = NULL;
|
2018-12-19 14:08:50 +08:00
|
|
|
dev_put(rif->dev);
|
2017-05-26 14:37:40 +08:00
|
|
|
kfree(rif);
|
|
|
|
err_rif_alloc:
|
2017-06-04 22:53:40 +08:00
|
|
|
err_rif_index_alloc:
|
2017-10-02 18:14:56 +08:00
|
|
|
vr->rif_count--;
|
2018-01-22 16:17:42 +08:00
|
|
|
mlxsw_sp_vr_put(mlxsw_sp, vr);
|
2017-03-10 15:53:39 +08:00
|
|
|
return ERR_PTR(err);
|
|
|
|
}
|
|
|
|
|
mlxsw: spectrum_router: Do not destroy RIFs based on FID's reference count
Currently, when a RIF is constructed on top of a FID, the RIF increments
the FID's reference count and the RIF is destroyed when the FID's
reference count drops to 1. This effectively means that when no local
ports are member in the FID, the FID is destroyed regardless if the
router port is a member in the FID or not.
The above can lead to the unexpected behavior in which routes using a
VLAN interface as their nexthop device are no longer offloaded after the
last local port leaves the corresponding VLAN (FID).
Example:
# ip -4 route show dev br0.10
192.0.2.0/24 proto kernel scope link src 192.0.2.1 offload
# bridge vlan del vid 10 dev swp3
# ip -4 route show dev br0.10
192.0.2.0/24 proto kernel scope link src 192.0.2.1
After the patch, the route is offloaded before and after the VLAN is
removed from local port 'swp3', as the RIF corresponding to 'br0.10'
continues to exist.
In order to remove RIFs' reliance on the underlying FID's reference
count, we need to add a reference count to sub-port RIFs, which are RIFs
that correspond to physical ports and their uppers (e.g., LAG devices).
In this case, each {Port, VID} ('struct mlxsw_sp_port_vlan') needs to
hold a reference on the RIF. For example:
bond0.10
|
bond0
|
+-------+
| |
swp1 swp2
Both {Port 1, VID 10} and {Port 2, VID 10} will hold a reference on the
RIF corresponding to 'bond0.10'. When the last reference is dropped, the
RIF will be destroyed.
Signed-off-by: Ido Schimmel <idosch@mellanox.com>
Reviewed-by: Petr Machata <petrm@mellanox.com>
Signed-off-by: David S. Miller <davem@davemloft.net>
2018-12-19 14:08:38 +08:00
|
|
|
static void mlxsw_sp_rif_destroy(struct mlxsw_sp_rif *rif)
|
2017-03-10 15:53:39 +08:00
|
|
|
{
|
2017-05-26 14:37:40 +08:00
|
|
|
const struct mlxsw_sp_rif_ops *ops = rif->ops;
|
|
|
|
struct mlxsw_sp *mlxsw_sp = rif->mlxsw_sp;
|
2017-05-26 14:37:39 +08:00
|
|
|
struct mlxsw_sp_fid *fid = rif->fid;
|
2017-05-26 14:37:40 +08:00
|
|
|
struct mlxsw_sp_vr *vr;
|
2018-03-26 20:01:40 +08:00
|
|
|
int i;
|
2017-03-10 15:53:39 +08:00
|
|
|
|
2017-03-17 16:38:00 +08:00
|
|
|
mlxsw_sp_router_rif_gone_sync(mlxsw_sp, rif);
|
2017-05-26 14:37:40 +08:00
|
|
|
vr = &mlxsw_sp->router->vrs[rif->vr_id];
|
2017-03-28 23:24:15 +08:00
|
|
|
|
2017-05-26 14:37:40 +08:00
|
|
|
mlxsw_sp_rif_counters_free(rif);
|
2018-03-26 20:01:40 +08:00
|
|
|
for (i = 0; i < MLXSW_SP_L3_PROTO_MAX; i++)
|
|
|
|
mlxsw_sp_mr_rif_del(vr->mr_table[i], rif);
|
2017-05-26 14:37:40 +08:00
|
|
|
ops->deconfigure(rif);
|
2017-09-03 05:49:18 +08:00
|
|
|
if (fid)
|
|
|
|
/* Loopback RIFs are not associated with a FID. */
|
|
|
|
mlxsw_sp_fid_put(fid);
|
2019-01-20 14:50:46 +08:00
|
|
|
mlxsw_sp->router->rifs[rif->rif_index] = NULL;
|
2018-12-19 14:08:50 +08:00
|
|
|
dev_put(rif->dev);
|
2017-05-26 14:37:40 +08:00
|
|
|
kfree(rif);
|
2017-10-02 18:14:56 +08:00
|
|
|
vr->rif_count--;
|
2018-01-22 16:17:42 +08:00
|
|
|
mlxsw_sp_vr_put(mlxsw_sp, vr);
|
2017-03-10 15:53:39 +08:00
|
|
|
}
|
|
|
|
|
2018-08-24 20:41:35 +08:00
|
|
|
/* Destroy the RIF associated with @dev, if there is one. */
void mlxsw_sp_rif_destroy_by_dev(struct mlxsw_sp *mlxsw_sp,
				 struct net_device *dev)
{
	struct mlxsw_sp_rif *rif = mlxsw_sp_rif_find_by_dev(mlxsw_sp, dev);

	if (rif)
		mlxsw_sp_rif_destroy(rif);
}
|
|
|
|
|
2017-05-26 14:37:40 +08:00
|
|
|
static void
|
|
|
|
mlxsw_sp_rif_subport_params_init(struct mlxsw_sp_rif_params *params,
|
|
|
|
struct mlxsw_sp_port_vlan *mlxsw_sp_port_vlan)
|
|
|
|
{
|
|
|
|
struct mlxsw_sp_port *mlxsw_sp_port = mlxsw_sp_port_vlan->mlxsw_sp_port;
|
|
|
|
|
|
|
|
params->vid = mlxsw_sp_port_vlan->vid;
|
|
|
|
params->lag = mlxsw_sp_port->lagged;
|
|
|
|
if (params->lag)
|
|
|
|
params->lag_id = mlxsw_sp_port->lag_id;
|
|
|
|
else
|
|
|
|
params->system_port = mlxsw_sp_port->local_port;
|
|
|
|
}
|
|
|
|
|
mlxsw: spectrum_router: Do not destroy RIFs based on FID's reference count
Currently, when a RIF is constructed on top of a FID, the RIF increments
the FID's reference count and the RIF is destroyed when the FID's
reference count drops to 1. This effectively means that when no local
ports are member in the FID, the FID is destroyed regardless if the
router port is a member in the FID or not.
The above can lead to the unexpected behavior in which routes using a
VLAN interface as their nexthop device are no longer offloaded after the
last local port leaves the corresponding VLAN (FID).
Example:
# ip -4 route show dev br0.10
192.0.2.0/24 proto kernel scope link src 192.0.2.1 offload
# bridge vlan del vid 10 dev swp3
# ip -4 route show dev br0.10
192.0.2.0/24 proto kernel scope link src 192.0.2.1
After the patch, the route is offloaded before and after the VLAN is
removed from local port 'swp3', as the RIF corresponding to 'br0.10'
continues to exist.
In order to remove RIFs' reliance on the underlying FID's reference
count, we need to add a reference count to sub-port RIFs, which are RIFs
that correspond to physical ports and their uppers (e.g., LAG devices).
In this case, each {Port, VID} ('struct mlxsw_sp_port_vlan') needs to
hold a reference on the RIF. For example:
bond0.10
|
bond0
|
+-------+
| |
swp1 swp2
Both {Port 1, VID 10} and {Port 2, VID 10} will hold a reference on the
RIF corresponding to 'bond0.10'. When the last reference is dropped, the
RIF will be destroyed.
Signed-off-by: Ido Schimmel <idosch@mellanox.com>
Reviewed-by: Petr Machata <petrm@mellanox.com>
Signed-off-by: David S. Miller <davem@davemloft.net>
2018-12-19 14:08:38 +08:00
|
|
|
static struct mlxsw_sp_rif_subport *
|
|
|
|
mlxsw_sp_rif_subport_rif(const struct mlxsw_sp_rif *rif)
|
|
|
|
{
|
|
|
|
return container_of(rif, struct mlxsw_sp_rif_subport, common);
|
|
|
|
}
|
|
|
|
|
|
|
|
static struct mlxsw_sp_rif *
|
|
|
|
mlxsw_sp_rif_subport_get(struct mlxsw_sp *mlxsw_sp,
|
|
|
|
const struct mlxsw_sp_rif_params *params,
|
|
|
|
struct netlink_ext_ack *extack)
|
|
|
|
{
|
|
|
|
struct mlxsw_sp_rif_subport *rif_subport;
|
|
|
|
struct mlxsw_sp_rif *rif;
|
|
|
|
|
|
|
|
rif = mlxsw_sp_rif_find_by_dev(mlxsw_sp, params->dev);
|
|
|
|
if (!rif)
|
|
|
|
return mlxsw_sp_rif_create(mlxsw_sp, params, extack);
|
|
|
|
|
|
|
|
rif_subport = mlxsw_sp_rif_subport_rif(rif);
|
|
|
|
refcount_inc(&rif_subport->ref_count);
|
|
|
|
return rif;
|
|
|
|
}
|
|
|
|
|
|
|
|
static void mlxsw_sp_rif_subport_put(struct mlxsw_sp_rif *rif)
|
|
|
|
{
|
|
|
|
struct mlxsw_sp_rif_subport *rif_subport;
|
|
|
|
|
|
|
|
rif_subport = mlxsw_sp_rif_subport_rif(rif);
|
|
|
|
if (!refcount_dec_and_test(&rif_subport->ref_count))
|
|
|
|
return;
|
|
|
|
|
|
|
|
mlxsw_sp_rif_destroy(rif);
|
|
|
|
}
|
|
|
|
|
2017-05-26 14:37:28 +08:00
|
|
|
static int
|
2017-05-26 14:37:39 +08:00
|
|
|
mlxsw_sp_port_vlan_router_join(struct mlxsw_sp_port_vlan *mlxsw_sp_port_vlan,
|
2017-10-19 00:56:56 +08:00
|
|
|
struct net_device *l3_dev,
|
|
|
|
struct netlink_ext_ack *extack)
|
2017-03-10 15:53:39 +08:00
|
|
|
{
|
2017-05-26 14:37:28 +08:00
|
|
|
struct mlxsw_sp_port *mlxsw_sp_port = mlxsw_sp_port_vlan->mlxsw_sp_port;
|
2017-05-26 14:37:36 +08:00
|
|
|
struct mlxsw_sp *mlxsw_sp = mlxsw_sp_port->mlxsw_sp;
|
mlxsw: spectrum_router: Do not destroy RIFs based on FID's reference count
Currently, when a RIF is constructed on top of a FID, the RIF increments
the FID's reference count and the RIF is destroyed when the FID's
reference count drops to 1. This effectively means that when no local
ports are member in the FID, the FID is destroyed regardless if the
router port is a member in the FID or not.
The above can lead to the unexpected behavior in which routes using a
VLAN interface as their nexthop device are no longer offloaded after the
last local port leaves the corresponding VLAN (FID).
Example:
# ip -4 route show dev br0.10
192.0.2.0/24 proto kernel scope link src 192.0.2.1 offload
# bridge vlan del vid 10 dev swp3
# ip -4 route show dev br0.10
192.0.2.0/24 proto kernel scope link src 192.0.2.1
After the patch, the route is offloaded before and after the VLAN is
removed from local port 'swp3', as the RIF corresponding to 'br0.10'
continues to exists.
In order to remove RIFs' reliance on the underlying FID's reference
count, we need to add a reference count to sub-port RIFs, which are RIFs
that correspond to physical ports and their uppers (e.g., LAG devices).
In this case, each {Port, VID} ('struct mlxsw_sp_port_vlan') needs to
hold a reference on the RIF. For example:
bond0.10
|
bond0
|
+-------+
| |
swp1 swp2
Both {Port 1, VID 10} and {Port 2, VID 10} will hold a reference on the
RIF corresponding to 'bond0.10'. When the last reference is dropped, the
RIF will be destroyed.
Signed-off-by: Ido Schimmel <idosch@mellanox.com>
Reviewed-by: Petr Machata <petrm@mellanox.com>
Signed-off-by: David S. Miller <davem@davemloft.net>
2018-12-19 14:08:38 +08:00
|
|
|
struct mlxsw_sp_rif_params params = {
|
|
|
|
.dev = l3_dev,
|
|
|
|
};
|
2017-05-26 14:37:28 +08:00
|
|
|
u16 vid = mlxsw_sp_port_vlan->vid;
|
2017-03-17 16:38:00 +08:00
|
|
|
struct mlxsw_sp_rif *rif;
|
2017-05-26 14:37:39 +08:00
|
|
|
struct mlxsw_sp_fid *fid;
|
2017-05-24 03:56:30 +08:00
|
|
|
int err;
|
2017-03-10 15:53:39 +08:00
|
|
|
|
mlxsw: spectrum_router: Do not destroy RIFs based on FID's reference count
Currently, when a RIF is constructed on top of a FID, the RIF increments
the FID's reference count and the RIF is destroyed when the FID's
reference count drops to 1. This effectively means that when no local
ports are member in the FID, the FID is destroyed regardless if the
router port is a member in the FID or not.
The above can lead to the unexpected behavior in which routes using a
VLAN interface as their nexthop device are no longer offloaded after the
last local port leaves the corresponding VLAN (FID).
Example:
# ip -4 route show dev br0.10
192.0.2.0/24 proto kernel scope link src 192.0.2.1 offload
# bridge vlan del vid 10 dev swp3
# ip -4 route show dev br0.10
192.0.2.0/24 proto kernel scope link src 192.0.2.1
After the patch, the route is offloaded before and after the VLAN is
removed from local port 'swp3', as the RIF corresponding to 'br0.10'
continues to exists.
In order to remove RIFs' reliance on the underlying FID's reference
count, we need to add a reference count to sub-port RIFs, which are RIFs
that correspond to physical ports and their uppers (e.g., LAG devices).
In this case, each {Port, VID} ('struct mlxsw_sp_port_vlan') needs to
hold a reference on the RIF. For example:
bond0.10
|
bond0
|
+-------+
| |
swp1 swp2
Both {Port 1, VID 10} and {Port 2, VID 10} will hold a reference on the
RIF corresponding to 'bond0.10'. When the last reference is dropped, the
RIF will be destroyed.
Signed-off-by: Ido Schimmel <idosch@mellanox.com>
Reviewed-by: Petr Machata <petrm@mellanox.com>
Signed-off-by: David S. Miller <davem@davemloft.net>
2018-12-19 14:08:38 +08:00
|
|
|
mlxsw_sp_rif_subport_params_init(¶ms, mlxsw_sp_port_vlan);
|
|
|
|
rif = mlxsw_sp_rif_subport_get(mlxsw_sp, ¶ms, extack);
|
|
|
|
if (IS_ERR(rif))
|
|
|
|
return PTR_ERR(rif);
|
2017-03-10 15:53:39 +08:00
|
|
|
|
2017-05-26 14:37:39 +08:00
|
|
|
/* FID was already created, just take a reference */
|
2018-06-25 15:48:13 +08:00
|
|
|
fid = rif->ops->fid_get(rif, extack);
|
2017-05-26 14:37:39 +08:00
|
|
|
err = mlxsw_sp_fid_port_vid_map(fid, mlxsw_sp_port, vid);
|
|
|
|
if (err)
|
|
|
|
goto err_fid_port_vid_map;
|
|
|
|
|
2017-05-26 14:37:28 +08:00
|
|
|
err = mlxsw_sp_port_vid_learning_set(mlxsw_sp_port, vid, false);
|
2017-05-24 03:56:30 +08:00
|
|
|
if (err)
|
|
|
|
goto err_port_vid_learning_set;
|
|
|
|
|
2017-05-26 14:37:28 +08:00
|
|
|
err = mlxsw_sp_port_vid_stp_set(mlxsw_sp_port, vid,
|
2017-05-24 03:56:30 +08:00
|
|
|
BR_STATE_FORWARDING);
|
|
|
|
if (err)
|
|
|
|
goto err_port_vid_stp_set;
|
|
|
|
|
2017-05-26 14:37:39 +08:00
|
|
|
mlxsw_sp_port_vlan->fid = fid;
|
2017-03-10 15:53:39 +08:00
|
|
|
|
|
|
|
return 0;
|
2017-05-24 03:56:30 +08:00
|
|
|
|
|
|
|
err_port_vid_stp_set:
|
2017-05-26 14:37:28 +08:00
|
|
|
mlxsw_sp_port_vid_learning_set(mlxsw_sp_port, vid, true);
|
2017-05-24 03:56:30 +08:00
|
|
|
err_port_vid_learning_set:
|
2017-05-26 14:37:39 +08:00
|
|
|
mlxsw_sp_fid_port_vid_unmap(fid, mlxsw_sp_port, vid);
|
|
|
|
err_fid_port_vid_map:
|
|
|
|
mlxsw_sp_fid_put(fid);
|
mlxsw: spectrum_router: Do not destroy RIFs based on FID's reference count
Currently, when a RIF is constructed on top of a FID, the RIF increments
the FID's reference count and the RIF is destroyed when the FID's
reference count drops to 1. This effectively means that when no local
ports are member in the FID, the FID is destroyed regardless if the
router port is a member in the FID or not.
The above can lead to the unexpected behavior in which routes using a
VLAN interface as their nexthop device are no longer offloaded after the
last local port leaves the corresponding VLAN (FID).
Example:
# ip -4 route show dev br0.10
192.0.2.0/24 proto kernel scope link src 192.0.2.1 offload
# bridge vlan del vid 10 dev swp3
# ip -4 route show dev br0.10
192.0.2.0/24 proto kernel scope link src 192.0.2.1
After the patch, the route is offloaded before and after the VLAN is
removed from local port 'swp3', as the RIF corresponding to 'br0.10'
continues to exists.
In order to remove RIFs' reliance on the underlying FID's reference
count, we need to add a reference count to sub-port RIFs, which are RIFs
that correspond to physical ports and their uppers (e.g., LAG devices).
In this case, each {Port, VID} ('struct mlxsw_sp_port_vlan') needs to
hold a reference on the RIF. For example:
bond0.10
|
bond0
|
+-------+
| |
swp1 swp2
Both {Port 1, VID 10} and {Port 2, VID 10} will hold a reference on the
RIF corresponding to 'bond0.10'. When the last reference is dropped, the
RIF will be destroyed.
Signed-off-by: Ido Schimmel <idosch@mellanox.com>
Reviewed-by: Petr Machata <petrm@mellanox.com>
Signed-off-by: David S. Miller <davem@davemloft.net>
2018-12-19 14:08:38 +08:00
|
|
|
mlxsw_sp_rif_subport_put(rif);
|
2017-05-24 03:56:30 +08:00
|
|
|
return err;
|
2017-03-10 15:53:39 +08:00
|
|
|
}
|
|
|
|
|
2020-02-20 15:07:57 +08:00
|
|
|
static void
|
|
|
|
__mlxsw_sp_port_vlan_router_leave(struct mlxsw_sp_port_vlan *mlxsw_sp_port_vlan)
|
2017-03-10 15:53:39 +08:00
|
|
|
{
|
2017-05-26 14:37:27 +08:00
|
|
|
struct mlxsw_sp_port *mlxsw_sp_port = mlxsw_sp_port_vlan->mlxsw_sp_port;
|
2017-05-26 14:37:28 +08:00
|
|
|
struct mlxsw_sp_fid *fid = mlxsw_sp_port_vlan->fid;
|
mlxsw: spectrum_router: Do not destroy RIFs based on FID's reference count
Currently, when a RIF is constructed on top of a FID, the RIF increments
the FID's reference count and the RIF is destroyed when the FID's
reference count drops to 1. This effectively means that when no local
ports are member in the FID, the FID is destroyed regardless if the
router port is a member in the FID or not.
The above can lead to the unexpected behavior in which routes using a
VLAN interface as their nexthop device are no longer offloaded after the
last local port leaves the corresponding VLAN (FID).
Example:
# ip -4 route show dev br0.10
192.0.2.0/24 proto kernel scope link src 192.0.2.1 offload
# bridge vlan del vid 10 dev swp3
# ip -4 route show dev br0.10
192.0.2.0/24 proto kernel scope link src 192.0.2.1
After the patch, the route is offloaded before and after the VLAN is
removed from local port 'swp3', as the RIF corresponding to 'br0.10'
continues to exists.
In order to remove RIFs' reliance on the underlying FID's reference
count, we need to add a reference count to sub-port RIFs, which are RIFs
that correspond to physical ports and their uppers (e.g., LAG devices).
In this case, each {Port, VID} ('struct mlxsw_sp_port_vlan') needs to
hold a reference on the RIF. For example:
bond0.10
|
bond0
|
+-------+
| |
swp1 swp2
Both {Port 1, VID 10} and {Port 2, VID 10} will hold a reference on the
RIF corresponding to 'bond0.10'. When the last reference is dropped, the
RIF will be destroyed.
Signed-off-by: Ido Schimmel <idosch@mellanox.com>
Reviewed-by: Petr Machata <petrm@mellanox.com>
Signed-off-by: David S. Miller <davem@davemloft.net>
2018-12-19 14:08:38 +08:00
|
|
|
struct mlxsw_sp_rif *rif = mlxsw_sp_fid_rif(fid);
|
2017-05-26 14:37:27 +08:00
|
|
|
u16 vid = mlxsw_sp_port_vlan->vid;
|
|
|
|
|
2017-05-26 14:37:39 +08:00
|
|
|
if (WARN_ON(mlxsw_sp_fid_type(fid) != MLXSW_SP_FID_TYPE_RFID))
|
|
|
|
return;
|
2017-05-26 14:37:25 +08:00
|
|
|
|
2017-05-26 14:37:39 +08:00
|
|
|
mlxsw_sp_port_vlan->fid = NULL;
|
2017-05-26 14:37:28 +08:00
|
|
|
mlxsw_sp_port_vid_stp_set(mlxsw_sp_port, vid, BR_STATE_BLOCKING);
|
|
|
|
mlxsw_sp_port_vid_learning_set(mlxsw_sp_port, vid, true);
|
2017-05-26 14:37:39 +08:00
|
|
|
mlxsw_sp_fid_port_vid_unmap(fid, mlxsw_sp_port, vid);
|
|
|
|
mlxsw_sp_fid_put(fid);
|
mlxsw: spectrum_router: Do not destroy RIFs based on FID's reference count
Currently, when a RIF is constructed on top of a FID, the RIF increments
the FID's reference count and the RIF is destroyed when the FID's
reference count drops to 1. This effectively means that when no local
ports are member in the FID, the FID is destroyed regardless if the
router port is a member in the FID or not.
The above can lead to the unexpected behavior in which routes using a
VLAN interface as their nexthop device are no longer offloaded after the
last local port leaves the corresponding VLAN (FID).
Example:
# ip -4 route show dev br0.10
192.0.2.0/24 proto kernel scope link src 192.0.2.1 offload
# bridge vlan del vid 10 dev swp3
# ip -4 route show dev br0.10
192.0.2.0/24 proto kernel scope link src 192.0.2.1
After the patch, the route is offloaded before and after the VLAN is
removed from local port 'swp3', as the RIF corresponding to 'br0.10'
continues to exists.
In order to remove RIFs' reliance on the underlying FID's reference
count, we need to add a reference count to sub-port RIFs, which are RIFs
that correspond to physical ports and their uppers (e.g., LAG devices).
In this case, each {Port, VID} ('struct mlxsw_sp_port_vlan') needs to
hold a reference on the RIF. For example:
bond0.10
|
bond0
|
+-------+
| |
swp1 swp2
Both {Port 1, VID 10} and {Port 2, VID 10} will hold a reference on the
RIF corresponding to 'bond0.10'. When the last reference is dropped, the
RIF will be destroyed.
Signed-off-by: Ido Schimmel <idosch@mellanox.com>
Reviewed-by: Petr Machata <petrm@mellanox.com>
Signed-off-by: David S. Miller <davem@davemloft.net>
2018-12-19 14:08:38 +08:00
|
|
|
mlxsw_sp_rif_subport_put(rif);
|
2017-03-10 15:53:39 +08:00
|
|
|
}
|
|
|
|
|
2020-02-20 15:07:57 +08:00
|
|
|
/* Non-static entry point that forwards to
 * __mlxsw_sp_port_vlan_router_leave().
 */
void
mlxsw_sp_port_vlan_router_leave(struct mlxsw_sp_port_vlan *mlxsw_sp_port_vlan)
{
	__mlxsw_sp_port_vlan_router_leave(mlxsw_sp_port_vlan);
}
|
|
|
|
|
2017-05-26 14:37:28 +08:00
|
|
|
/* Handle an address event for @l3_dev on top of {@port_dev, @vid}.
 *
 * NETDEV_UP joins the port-VLAN to the router and returns the join result;
 * NETDEV_DOWN makes it leave. Any other event is ignored. Returns -EINVAL
 * (with a warning) when no port-VLAN exists for @vid on the port.
 */
static int mlxsw_sp_inetaddr_port_vlan_event(struct net_device *l3_dev,
					     struct net_device *port_dev,
					     unsigned long event, u16 vid,
					     struct netlink_ext_ack *extack)
{
	struct mlxsw_sp_port *port = netdev_priv(port_dev);
	struct mlxsw_sp_port_vlan *port_vlan;

	port_vlan = mlxsw_sp_port_vlan_find_by_vid(port, vid);
	if (WARN_ON(!port_vlan))
		return -EINVAL;

	if (event == NETDEV_UP)
		return mlxsw_sp_port_vlan_router_join(port_vlan, l3_dev,
						      extack);

	if (event == NETDEV_DOWN)
		__mlxsw_sp_port_vlan_router_leave(port_vlan);

	return 0;
}
|
|
|
|
|
|
|
|
static int mlxsw_sp_inetaddr_port_event(struct net_device *port_dev,
|
2017-10-19 00:56:56 +08:00
|
|
|
unsigned long event,
|
|
|
|
struct netlink_ext_ack *extack)
|
2017-03-10 15:53:39 +08:00
|
|
|
{
|
2017-04-18 22:55:37 +08:00
|
|
|
if (netif_is_bridge_port(port_dev) ||
|
|
|
|
netif_is_lag_port(port_dev) ||
|
|
|
|
netif_is_ovs_port(port_dev))
|
2017-03-10 15:53:39 +08:00
|
|
|
return 0;
|
|
|
|
|
2018-12-21 03:42:26 +08:00
|
|
|
return mlxsw_sp_inetaddr_port_vlan_event(port_dev, port_dev, event,
|
|
|
|
MLXSW_SP_DEFAULT_VID, extack);
|
2017-03-10 15:53:39 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
/* Propagate an address event for @l3_dev to every lower device of
 * @lag_dev that passes mlxsw_sp_port_dev_check().
 *
 * Stops at, and returns, the first non-zero result; members handled
 * before the failure are not rolled back here.
 */
static int __mlxsw_sp_inetaddr_lag_event(struct net_device *l3_dev,
					 struct net_device *lag_dev,
					 unsigned long event, u16 vid,
					 struct netlink_ext_ack *extack)
{
	struct net_device *lower;
	struct list_head *iter;
	int err;

	netdev_for_each_lower_dev(lag_dev, lower, iter) {
		if (!mlxsw_sp_port_dev_check(lower))
			continue;

		err = mlxsw_sp_inetaddr_port_vlan_event(l3_dev, lower, event,
							vid, extack);
		if (err)
			return err;
	}

	return 0;
}
|
|
|
|
|
|
|
|
static int mlxsw_sp_inetaddr_lag_event(struct net_device *lag_dev,
|
2017-10-19 00:56:56 +08:00
|
|
|
unsigned long event,
|
|
|
|
struct netlink_ext_ack *extack)
|
2017-03-10 15:53:39 +08:00
|
|
|
{
|
|
|
|
if (netif_is_bridge_port(lag_dev))
|
|
|
|
return 0;
|
|
|
|
|
2018-12-21 03:42:26 +08:00
|
|
|
return __mlxsw_sp_inetaddr_lag_event(lag_dev, lag_dev, event,
|
|
|
|
MLXSW_SP_DEFAULT_VID, extack);
|
2017-03-10 15:53:39 +08:00
|
|
|
}
|
|
|
|
|
2018-12-19 14:08:47 +08:00
|
|
|
static int mlxsw_sp_inetaddr_bridge_event(struct mlxsw_sp *mlxsw_sp,
|
|
|
|
struct net_device *l3_dev,
|
2017-10-19 00:56:56 +08:00
|
|
|
unsigned long event,
|
|
|
|
struct netlink_ext_ack *extack)
|
2017-03-10 15:53:39 +08:00
|
|
|
{
|
2017-05-26 14:37:40 +08:00
|
|
|
struct mlxsw_sp_rif_params params = {
|
|
|
|
.dev = l3_dev,
|
|
|
|
};
|
2017-05-26 14:37:39 +08:00
|
|
|
struct mlxsw_sp_rif *rif;
|
2017-03-10 15:53:39 +08:00
|
|
|
|
|
|
|
switch (event) {
|
|
|
|
case NETDEV_UP:
|
2017-10-19 00:56:56 +08:00
|
|
|
rif = mlxsw_sp_rif_create(mlxsw_sp, ¶ms, extack);
|
2017-05-26 14:37:40 +08:00
|
|
|
if (IS_ERR(rif))
|
|
|
|
return PTR_ERR(rif);
|
|
|
|
break;
|
2017-03-10 15:53:39 +08:00
|
|
|
case NETDEV_DOWN:
|
2017-05-26 14:37:39 +08:00
|
|
|
rif = mlxsw_sp_rif_find_by_dev(mlxsw_sp, l3_dev);
|
2017-05-26 14:37:40 +08:00
|
|
|
mlxsw_sp_rif_destroy(rif);
|
2017-03-10 15:53:39 +08:00
|
|
|
break;
|
|
|
|
}
|
|
|
|
|
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
2018-12-19 14:08:47 +08:00
|
|
|
static int mlxsw_sp_inetaddr_vlan_event(struct mlxsw_sp *mlxsw_sp,
|
|
|
|
struct net_device *vlan_dev,
|
2017-10-19 00:56:56 +08:00
|
|
|
unsigned long event,
|
|
|
|
struct netlink_ext_ack *extack)
|
2017-03-10 15:53:39 +08:00
|
|
|
{
|
|
|
|
struct net_device *real_dev = vlan_dev_real_dev(vlan_dev);
|
|
|
|
u16 vid = vlan_dev_vlan_id(vlan_dev);
|
|
|
|
|
2017-06-28 14:03:12 +08:00
|
|
|
if (netif_is_bridge_port(vlan_dev))
|
|
|
|
return 0;
|
|
|
|
|
2017-03-10 15:53:39 +08:00
|
|
|
if (mlxsw_sp_port_dev_check(real_dev))
|
2017-05-26 14:37:28 +08:00
|
|
|
return mlxsw_sp_inetaddr_port_vlan_event(vlan_dev, real_dev,
|
2017-10-19 00:56:56 +08:00
|
|
|
event, vid, extack);
|
2017-03-10 15:53:39 +08:00
|
|
|
else if (netif_is_lag_master(real_dev))
|
|
|
|
return __mlxsw_sp_inetaddr_lag_event(vlan_dev, real_dev, event,
|
2017-10-19 00:56:56 +08:00
|
|
|
vid, extack);
|
mlxsw: spectrum: Replace vPorts with Port-VLAN
As explained in the cover letter, since the introduction of the bridge
offload in the mlxsw driver, information related to the offloaded bridge
and bridge ports was stored in the individual port struct,
mlxsw_sp_port.
This lead to a bloated struct storing both physical properties of the
port (e.g., autoneg status) as well as logical properties of an upper
bridge port (e.g., learning, mrouter indication). While this might work
well for simple devices, it proved to be hard to extend when stacked
devices were taken into account and more advanced use-cases (e.g., IGMP
snooping) considered.
This patch removes the excess information from the above struct and
instead stores it in more appropriate structs that represent the bridge
port, the bridge itself and a VLAN configured on the bridge port.
The membership of a port in a bridge is denoted using the Port-VLAN
struct, which points to the bridge port and also member in the bridge
VLAN group of the VLAN it represents. This allows us to completely
remove the vPort abstraction and consolidate many of the code paths
relating to VLAN-aware and unaware bridges.
Note that the FID / vFID code is currently duplicated, but this will
soon go away when the common FID core will be introduced.
Signed-off-by: Ido Schimmel <idosch@mellanox.com>
Signed-off-by: Jiri Pirko <jiri@mellanox.com>
Signed-off-by: David S. Miller <davem@davemloft.net>
2017-05-26 14:37:31 +08:00
|
|
|
else if (netif_is_bridge_master(real_dev) && br_vlan_enabled(real_dev))
|
2018-12-19 14:08:47 +08:00
|
|
|
return mlxsw_sp_inetaddr_bridge_event(mlxsw_sp, vlan_dev, event,
|
|
|
|
extack);
|
2017-03-10 15:53:39 +08:00
|
|
|
|
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
2018-07-14 16:39:54 +08:00
|
|
|
static bool mlxsw_sp_rif_macvlan_is_vrrp4(const u8 *mac)
|
|
|
|
{
|
|
|
|
u8 vrrp4[ETH_ALEN] = { 0x00, 0x00, 0x5e, 0x00, 0x01, 0x00 };
|
|
|
|
u8 mask[ETH_ALEN] = { 0xff, 0xff, 0xff, 0xff, 0xff, 0x00 };
|
|
|
|
|
|
|
|
return ether_addr_equal_masked(mac, vrrp4, mask);
|
|
|
|
}
|
|
|
|
|
|
|
|
static bool mlxsw_sp_rif_macvlan_is_vrrp6(const u8 *mac)
|
|
|
|
{
|
|
|
|
u8 vrrp6[ETH_ALEN] = { 0x00, 0x00, 0x5e, 0x00, 0x02, 0x00 };
|
|
|
|
u8 mask[ETH_ALEN] = { 0xff, 0xff, 0xff, 0xff, 0xff, 0x00 };
|
|
|
|
|
|
|
|
return ether_addr_equal_masked(mac, vrrp6, mask);
|
|
|
|
}
|
|
|
|
|
|
|
|
static int mlxsw_sp_rif_vrrp_op(struct mlxsw_sp *mlxsw_sp, u16 rif_index,
|
|
|
|
const u8 *mac, bool adding)
|
|
|
|
{
|
|
|
|
char ritr_pl[MLXSW_REG_RITR_LEN];
|
|
|
|
u8 vrrp_id = adding ? mac[5] : 0;
|
|
|
|
int err;
|
|
|
|
|
|
|
|
if (!mlxsw_sp_rif_macvlan_is_vrrp4(mac) &&
|
|
|
|
!mlxsw_sp_rif_macvlan_is_vrrp6(mac))
|
|
|
|
return 0;
|
|
|
|
|
|
|
|
mlxsw_reg_ritr_rif_pack(ritr_pl, rif_index);
|
|
|
|
err = mlxsw_reg_query(mlxsw_sp->core, MLXSW_REG(ritr), ritr_pl);
|
|
|
|
if (err)
|
|
|
|
return err;
|
|
|
|
|
|
|
|
if (mlxsw_sp_rif_macvlan_is_vrrp4(mac))
|
|
|
|
mlxsw_reg_ritr_if_vrrp_id_ipv4_set(ritr_pl, vrrp_id);
|
|
|
|
else
|
|
|
|
mlxsw_reg_ritr_if_vrrp_id_ipv6_set(ritr_pl, vrrp_id);
|
|
|
|
|
|
|
|
return mlxsw_reg_write(mlxsw_sp->core, MLXSW_REG(ritr), ritr_pl);
|
|
|
|
}
|
|
|
|
|
2018-07-14 16:39:52 +08:00
|
|
|
static int mlxsw_sp_rif_macvlan_add(struct mlxsw_sp *mlxsw_sp,
|
|
|
|
const struct net_device *macvlan_dev,
|
|
|
|
struct netlink_ext_ack *extack)
|
|
|
|
{
|
|
|
|
struct macvlan_dev *vlan = netdev_priv(macvlan_dev);
|
|
|
|
struct mlxsw_sp_rif *rif;
|
|
|
|
int err;
|
|
|
|
|
|
|
|
rif = mlxsw_sp_rif_find_by_dev(mlxsw_sp, vlan->lowerdev);
|
|
|
|
if (!rif) {
|
|
|
|
NL_SET_ERR_MSG_MOD(extack, "macvlan is only supported on top of router interfaces");
|
|
|
|
return -EOPNOTSUPP;
|
|
|
|
}
|
|
|
|
|
|
|
|
err = mlxsw_sp_rif_fdb_op(mlxsw_sp, macvlan_dev->dev_addr,
|
|
|
|
mlxsw_sp_fid_index(rif->fid), true);
|
|
|
|
if (err)
|
|
|
|
return err;
|
|
|
|
|
2018-07-14 16:39:54 +08:00
|
|
|
err = mlxsw_sp_rif_vrrp_op(mlxsw_sp, rif->rif_index,
|
|
|
|
macvlan_dev->dev_addr, true);
|
|
|
|
if (err)
|
|
|
|
goto err_rif_vrrp_add;
|
|
|
|
|
2018-07-14 16:39:52 +08:00
|
|
|
/* Make sure the bridge driver does not have this MAC pointing at
|
|
|
|
* some other port.
|
|
|
|
*/
|
|
|
|
if (rif->ops->fdb_del)
|
|
|
|
rif->ops->fdb_del(rif, macvlan_dev->dev_addr);
|
|
|
|
|
|
|
|
return 0;
|
2018-07-14 16:39:54 +08:00
|
|
|
|
|
|
|
err_rif_vrrp_add:
|
|
|
|
mlxsw_sp_rif_fdb_op(mlxsw_sp, macvlan_dev->dev_addr,
|
|
|
|
mlxsw_sp_fid_index(rif->fid), false);
|
|
|
|
return err;
|
2018-07-14 16:39:52 +08:00
|
|
|
}
|
|
|
|
|
2020-02-20 15:07:56 +08:00
|
|
|
static void __mlxsw_sp_rif_macvlan_del(struct mlxsw_sp *mlxsw_sp,
|
|
|
|
const struct net_device *macvlan_dev)
|
2018-07-14 16:39:52 +08:00
|
|
|
{
|
|
|
|
struct macvlan_dev *vlan = netdev_priv(macvlan_dev);
|
|
|
|
struct mlxsw_sp_rif *rif;
|
|
|
|
|
|
|
|
rif = mlxsw_sp_rif_find_by_dev(mlxsw_sp, vlan->lowerdev);
|
|
|
|
/* If we do not have a RIF, then we already took care of
|
|
|
|
* removing the macvlan's MAC during RIF deletion.
|
|
|
|
*/
|
|
|
|
if (!rif)
|
|
|
|
return;
|
2018-07-14 16:39:54 +08:00
|
|
|
mlxsw_sp_rif_vrrp_op(mlxsw_sp, rif->rif_index, macvlan_dev->dev_addr,
|
|
|
|
false);
|
2018-07-14 16:39:52 +08:00
|
|
|
mlxsw_sp_rif_fdb_op(mlxsw_sp, macvlan_dev->dev_addr,
|
|
|
|
mlxsw_sp_fid_index(rif->fid), false);
|
|
|
|
}
|
|
|
|
|
2020-02-20 15:07:56 +08:00
|
|
|
/* Non-static entry point that forwards to __mlxsw_sp_rif_macvlan_del(). */
void mlxsw_sp_rif_macvlan_del(struct mlxsw_sp *mlxsw_sp,
			      const struct net_device *macvlan_dev)
{
	__mlxsw_sp_rif_macvlan_del(mlxsw_sp, macvlan_dev);
}
|
|
|
|
|
2018-12-19 14:08:47 +08:00
|
|
|
static int mlxsw_sp_inetaddr_macvlan_event(struct mlxsw_sp *mlxsw_sp,
|
|
|
|
struct net_device *macvlan_dev,
|
2018-07-14 16:39:52 +08:00
|
|
|
unsigned long event,
|
|
|
|
struct netlink_ext_ack *extack)
|
|
|
|
{
|
|
|
|
switch (event) {
|
|
|
|
case NETDEV_UP:
|
|
|
|
return mlxsw_sp_rif_macvlan_add(mlxsw_sp, macvlan_dev, extack);
|
|
|
|
case NETDEV_DOWN:
|
2020-02-20 15:07:56 +08:00
|
|
|
__mlxsw_sp_rif_macvlan_del(mlxsw_sp, macvlan_dev);
|
2018-07-14 16:39:52 +08:00
|
|
|
break;
|
|
|
|
}
|
|
|
|
|
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
2018-12-13 19:54:52 +08:00
|
|
|
static int mlxsw_sp_router_port_check_rif_addr(struct mlxsw_sp *mlxsw_sp,
|
|
|
|
struct net_device *dev,
|
|
|
|
const unsigned char *dev_addr,
|
|
|
|
struct netlink_ext_ack *extack)
|
|
|
|
{
|
|
|
|
struct mlxsw_sp_rif *rif;
|
|
|
|
int i;
|
|
|
|
|
|
|
|
/* A RIF is not created for macvlan netdevs. Their MAC is used to
|
|
|
|
* populate the FDB
|
|
|
|
*/
|
2019-04-10 14:58:15 +08:00
|
|
|
if (netif_is_macvlan(dev) || netif_is_l3_master(dev))
|
2018-12-13 19:54:52 +08:00
|
|
|
return 0;
|
|
|
|
|
|
|
|
for (i = 0; i < MLXSW_CORE_RES_GET(mlxsw_sp->core, MAX_RIFS); i++) {
|
|
|
|
rif = mlxsw_sp->router->rifs[i];
|
2019-12-29 19:40:22 +08:00
|
|
|
if (rif && rif->ops &&
|
|
|
|
rif->ops->type == MLXSW_SP_RIF_TYPE_IPIP_LB)
|
|
|
|
continue;
|
2019-01-20 14:50:49 +08:00
|
|
|
if (rif && rif->dev && rif->dev != dev &&
|
2018-12-13 19:54:52 +08:00
|
|
|
!ether_addr_equal_masked(rif->dev->dev_addr, dev_addr,
|
|
|
|
mlxsw_sp->mac_mask)) {
|
|
|
|
NL_SET_ERR_MSG_MOD(extack, "All router interface MAC addresses must have the same prefix");
|
|
|
|
return -EINVAL;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
2018-12-19 14:08:47 +08:00
|
|
|
/* Dispatch an address event to the handler matching the type of @dev:
 * port, LAG master, bridge master, VLAN device or macvlan, checked in
 * that order. Devices of any other type yield 0.
 */
static int __mlxsw_sp_inetaddr_event(struct mlxsw_sp *mlxsw_sp,
				     struct net_device *dev,
				     unsigned long event,
				     struct netlink_ext_ack *extack)
{
	if (mlxsw_sp_port_dev_check(dev))
		return mlxsw_sp_inetaddr_port_event(dev, event, extack);

	if (netif_is_lag_master(dev))
		return mlxsw_sp_inetaddr_lag_event(dev, event, extack);

	if (netif_is_bridge_master(dev))
		return mlxsw_sp_inetaddr_bridge_event(mlxsw_sp, dev, event,
						      extack);

	if (is_vlan_dev(dev))
		return mlxsw_sp_inetaddr_vlan_event(mlxsw_sp, dev, event,
						    extack);

	if (netif_is_macvlan(dev))
		return mlxsw_sp_inetaddr_macvlan_event(mlxsw_sp, dev, event,
						       extack);

	return 0;
}
|
|
|
|
|
2018-12-19 14:08:48 +08:00
|
|
|
static int mlxsw_sp_inetaddr_event(struct notifier_block *nb,
|
|
|
|
unsigned long event, void *ptr)
|
2017-03-10 15:53:39 +08:00
|
|
|
{
|
|
|
|
struct in_ifaddr *ifa = (struct in_ifaddr *) ptr;
|
|
|
|
struct net_device *dev = ifa->ifa_dev->dev;
|
2018-12-19 14:08:48 +08:00
|
|
|
struct mlxsw_sp_router *router;
|
2017-03-17 16:38:00 +08:00
|
|
|
struct mlxsw_sp_rif *rif;
|
2017-03-10 15:53:39 +08:00
|
|
|
int err = 0;
|
|
|
|
|
2017-10-19 00:56:55 +08:00
|
|
|
/* NETDEV_UP event is handled by mlxsw_sp_inetaddr_valid_event */
|
|
|
|
if (event == NETDEV_UP)
|
2020-02-22 01:54:13 +08:00
|
|
|
return NOTIFY_DONE;
|
2017-10-19 00:56:55 +08:00
|
|
|
|
2018-12-19 14:08:48 +08:00
|
|
|
router = container_of(nb, struct mlxsw_sp_router, inetaddr_nb);
|
2020-02-22 01:54:13 +08:00
|
|
|
mutex_lock(&router->lock);
|
2018-12-19 14:08:48 +08:00
|
|
|
rif = mlxsw_sp_rif_find_by_dev(router->mlxsw_sp, dev);
|
2017-10-19 00:56:55 +08:00
|
|
|
if (!mlxsw_sp_rif_should_config(rif, dev, event))
|
|
|
|
goto out;
|
|
|
|
|
2018-12-19 14:08:48 +08:00
|
|
|
err = __mlxsw_sp_inetaddr_event(router->mlxsw_sp, dev, event, NULL);
|
2017-10-19 00:56:55 +08:00
|
|
|
out:
|
2020-02-22 01:54:13 +08:00
|
|
|
mutex_unlock(&router->lock);
|
2017-10-19 00:56:55 +08:00
|
|
|
return notifier_from_errno(err);
|
|
|
|
}
|
|
|
|
|
|
|
|
int mlxsw_sp_inetaddr_valid_event(struct notifier_block *unused,
|
|
|
|
unsigned long event, void *ptr)
|
|
|
|
{
|
|
|
|
struct in_validator_info *ivi = (struct in_validator_info *) ptr;
|
|
|
|
struct net_device *dev = ivi->ivi_dev->dev;
|
|
|
|
struct mlxsw_sp *mlxsw_sp;
|
|
|
|
struct mlxsw_sp_rif *rif;
|
|
|
|
int err = 0;
|
|
|
|
|
2017-03-10 15:53:39 +08:00
|
|
|
mlxsw_sp = mlxsw_sp_lower_get(dev);
|
|
|
|
if (!mlxsw_sp)
|
2020-02-22 01:54:13 +08:00
|
|
|
return NOTIFY_DONE;
|
2017-03-10 15:53:39 +08:00
|
|
|
|
2020-02-22 01:54:13 +08:00
|
|
|
mutex_lock(&mlxsw_sp->router->lock);
|
2017-03-17 16:38:00 +08:00
|
|
|
rif = mlxsw_sp_rif_find_by_dev(mlxsw_sp, dev);
|
2017-07-18 16:10:13 +08:00
|
|
|
if (!mlxsw_sp_rif_should_config(rif, dev, event))
|
2017-03-10 15:53:39 +08:00
|
|
|
goto out;
|
|
|
|
|
2018-12-13 19:54:52 +08:00
|
|
|
err = mlxsw_sp_router_port_check_rif_addr(mlxsw_sp, dev, dev->dev_addr,
|
|
|
|
ivi->extack);
|
|
|
|
if (err)
|
|
|
|
goto out;
|
|
|
|
|
2018-12-19 14:08:47 +08:00
|
|
|
err = __mlxsw_sp_inetaddr_event(mlxsw_sp, dev, event, ivi->extack);
|
2017-03-10 15:53:39 +08:00
|
|
|
out:
|
2020-02-22 01:54:13 +08:00
|
|
|
mutex_unlock(&mlxsw_sp->router->lock);
|
2017-03-10 15:53:39 +08:00
|
|
|
return notifier_from_errno(err);
|
|
|
|
}
|
|
|
|
|
2017-07-18 16:10:13 +08:00
|
|
|
struct mlxsw_sp_inet6addr_event_work {
|
|
|
|
struct work_struct work;
|
2018-12-19 14:08:48 +08:00
|
|
|
struct mlxsw_sp *mlxsw_sp;
|
2017-07-18 16:10:13 +08:00
|
|
|
struct net_device *dev;
|
|
|
|
unsigned long event;
|
|
|
|
};
|
|
|
|
|
|
|
|
static void mlxsw_sp_inet6addr_event_work(struct work_struct *work)
|
|
|
|
{
|
|
|
|
struct mlxsw_sp_inet6addr_event_work *inet6addr_work =
|
|
|
|
container_of(work, struct mlxsw_sp_inet6addr_event_work, work);
|
2018-12-19 14:08:48 +08:00
|
|
|
struct mlxsw_sp *mlxsw_sp = inet6addr_work->mlxsw_sp;
|
2017-07-18 16:10:13 +08:00
|
|
|
struct net_device *dev = inet6addr_work->dev;
|
|
|
|
unsigned long event = inet6addr_work->event;
|
|
|
|
struct mlxsw_sp_rif *rif;
|
|
|
|
|
|
|
|
rtnl_lock();
|
2020-02-22 01:54:10 +08:00
|
|
|
mutex_lock(&mlxsw_sp->router->lock);
|
2017-07-18 16:10:13 +08:00
|
|
|
|
|
|
|
rif = mlxsw_sp_rif_find_by_dev(mlxsw_sp, dev);
|
|
|
|
if (!mlxsw_sp_rif_should_config(rif, dev, event))
|
|
|
|
goto out;
|
|
|
|
|
2018-12-19 14:08:47 +08:00
|
|
|
__mlxsw_sp_inetaddr_event(mlxsw_sp, dev, event, NULL);
|
2017-07-18 16:10:13 +08:00
|
|
|
out:
|
2020-02-22 01:54:10 +08:00
|
|
|
mutex_unlock(&mlxsw_sp->router->lock);
|
2017-07-18 16:10:13 +08:00
|
|
|
rtnl_unlock();
|
|
|
|
dev_put(dev);
|
|
|
|
kfree(inet6addr_work);
|
|
|
|
}
|
|
|
|
|
|
|
|
/* Called with rcu_read_lock() */
|
2018-12-19 14:08:48 +08:00
|
|
|
static int mlxsw_sp_inet6addr_event(struct notifier_block *nb,
|
|
|
|
unsigned long event, void *ptr)
|
2017-07-18 16:10:13 +08:00
|
|
|
{
|
|
|
|
struct inet6_ifaddr *if6 = (struct inet6_ifaddr *) ptr;
|
|
|
|
struct mlxsw_sp_inet6addr_event_work *inet6addr_work;
|
|
|
|
struct net_device *dev = if6->idev->dev;
|
2018-12-19 14:08:48 +08:00
|
|
|
struct mlxsw_sp_router *router;
|
2017-07-18 16:10:13 +08:00
|
|
|
|
2017-10-19 00:56:55 +08:00
|
|
|
/* NETDEV_UP event is handled by mlxsw_sp_inet6addr_valid_event */
|
|
|
|
if (event == NETDEV_UP)
|
|
|
|
return NOTIFY_DONE;
|
|
|
|
|
2017-07-18 16:10:13 +08:00
|
|
|
inet6addr_work = kzalloc(sizeof(*inet6addr_work), GFP_ATOMIC);
|
|
|
|
if (!inet6addr_work)
|
|
|
|
return NOTIFY_BAD;
|
|
|
|
|
2018-12-19 14:08:48 +08:00
|
|
|
router = container_of(nb, struct mlxsw_sp_router, inet6addr_nb);
|
2017-07-18 16:10:13 +08:00
|
|
|
INIT_WORK(&inet6addr_work->work, mlxsw_sp_inet6addr_event_work);
|
2018-12-19 14:08:48 +08:00
|
|
|
inet6addr_work->mlxsw_sp = router->mlxsw_sp;
|
2017-07-18 16:10:13 +08:00
|
|
|
inet6addr_work->dev = dev;
|
|
|
|
inet6addr_work->event = event;
|
|
|
|
dev_hold(dev);
|
|
|
|
mlxsw_core_schedule_work(&inet6addr_work->work);
|
|
|
|
|
|
|
|
return NOTIFY_DONE;
|
|
|
|
}
|
|
|
|
|
2017-10-19 00:56:55 +08:00
|
|
|
int mlxsw_sp_inet6addr_valid_event(struct notifier_block *unused,
|
|
|
|
unsigned long event, void *ptr)
|
|
|
|
{
|
|
|
|
struct in6_validator_info *i6vi = (struct in6_validator_info *) ptr;
|
|
|
|
struct net_device *dev = i6vi->i6vi_dev->dev;
|
|
|
|
struct mlxsw_sp *mlxsw_sp;
|
|
|
|
struct mlxsw_sp_rif *rif;
|
|
|
|
int err = 0;
|
|
|
|
|
|
|
|
mlxsw_sp = mlxsw_sp_lower_get(dev);
|
|
|
|
if (!mlxsw_sp)
|
2020-02-22 01:54:13 +08:00
|
|
|
return NOTIFY_DONE;
|
2017-10-19 00:56:55 +08:00
|
|
|
|
2020-02-22 01:54:13 +08:00
|
|
|
mutex_lock(&mlxsw_sp->router->lock);
|
2017-10-19 00:56:55 +08:00
|
|
|
rif = mlxsw_sp_rif_find_by_dev(mlxsw_sp, dev);
|
|
|
|
if (!mlxsw_sp_rif_should_config(rif, dev, event))
|
|
|
|
goto out;
|
|
|
|
|
2018-12-13 19:54:52 +08:00
|
|
|
err = mlxsw_sp_router_port_check_rif_addr(mlxsw_sp, dev, dev->dev_addr,
|
|
|
|
i6vi->extack);
|
|
|
|
if (err)
|
|
|
|
goto out;
|
|
|
|
|
2018-12-19 14:08:47 +08:00
|
|
|
err = __mlxsw_sp_inetaddr_event(mlxsw_sp, dev, event, i6vi->extack);
|
2017-10-19 00:56:55 +08:00
|
|
|
out:
|
2020-02-22 01:54:13 +08:00
|
|
|
mutex_unlock(&mlxsw_sp->router->lock);
|
2017-10-19 00:56:55 +08:00
|
|
|
return notifier_from_errno(err);
|
|
|
|
}
|
|
|
|
|
2017-03-17 16:38:00 +08:00
|
|
|
/* Rewrite the MAC address and MTU of an existing RIF.
 *
 * The current RITR record for @rif_index is queried first, the MTU and MAC
 * fields are overwritten in it, and the record is written back with the
 * RIF_CREATE operation. Returns 0 or the error of the register access.
 */
static int mlxsw_sp_rif_edit(struct mlxsw_sp *mlxsw_sp, u16 rif_index,
			     const char *mac, int mtu)
{
	char payload[MLXSW_REG_RITR_LEN];
	int rc;

	mlxsw_reg_ritr_rif_pack(payload, rif_index);
	rc = mlxsw_reg_query(mlxsw_sp->core, MLXSW_REG(ritr), payload);
	if (rc)
		return rc;

	mlxsw_reg_ritr_mtu_set(payload, mtu);
	mlxsw_reg_ritr_if_mac_memcpy_to(payload, mac);
	mlxsw_reg_ritr_op_set(payload, MLXSW_REG_RITR_RIF_CREATE);

	return mlxsw_reg_write(mlxsw_sp->core, MLXSW_REG(ritr), payload);
}
|
|
|
|
|
2018-12-13 19:54:48 +08:00
|
|
|
static int
|
|
|
|
mlxsw_sp_router_port_change_event(struct mlxsw_sp *mlxsw_sp,
|
|
|
|
struct mlxsw_sp_rif *rif)
|
2017-03-10 15:53:39 +08:00
|
|
|
{
|
2018-12-13 19:54:48 +08:00
|
|
|
struct net_device *dev = rif->dev;
|
2017-05-26 14:37:39 +08:00
|
|
|
u16 fid_index;
|
2017-03-10 15:53:39 +08:00
|
|
|
int err;
|
|
|
|
|
2017-05-26 14:37:39 +08:00
|
|
|
fid_index = mlxsw_sp_fid_index(rif->fid);
|
2017-03-10 15:53:39 +08:00
|
|
|
|
2017-05-26 14:37:39 +08:00
|
|
|
err = mlxsw_sp_rif_fdb_op(mlxsw_sp, rif->addr, fid_index, false);
|
2017-03-10 15:53:39 +08:00
|
|
|
if (err)
|
|
|
|
return err;
|
|
|
|
|
2017-03-17 16:38:00 +08:00
|
|
|
err = mlxsw_sp_rif_edit(mlxsw_sp, rif->rif_index, dev->dev_addr,
|
|
|
|
dev->mtu);
|
2017-03-10 15:53:39 +08:00
|
|
|
if (err)
|
|
|
|
goto err_rif_edit;
|
|
|
|
|
2017-05-26 14:37:39 +08:00
|
|
|
err = mlxsw_sp_rif_fdb_op(mlxsw_sp, dev->dev_addr, fid_index, true);
|
2017-03-10 15:53:39 +08:00
|
|
|
if (err)
|
|
|
|
goto err_rif_fdb_op;
|
|
|
|
|
2017-09-27 14:23:21 +08:00
|
|
|
if (rif->mtu != dev->mtu) {
|
|
|
|
struct mlxsw_sp_vr *vr;
|
2018-03-26 20:01:40 +08:00
|
|
|
int i;
|
2017-09-27 14:23:21 +08:00
|
|
|
|
|
|
|
/* The RIF is relevant only to its mr_table instance, as unlike
|
|
|
|
* unicast routing, in multicast routing a RIF cannot be shared
|
|
|
|
* between several multicast routing tables.
|
|
|
|
*/
|
|
|
|
vr = &mlxsw_sp->router->vrs[rif->vr_id];
|
2018-03-26 20:01:40 +08:00
|
|
|
for (i = 0; i < MLXSW_SP_L3_PROTO_MAX; i++)
|
|
|
|
mlxsw_sp_mr_rif_mtu_update(vr->mr_table[i],
|
|
|
|
rif, dev->mtu);
|
2017-09-27 14:23:21 +08:00
|
|
|
}
|
|
|
|
|
2017-03-17 16:38:00 +08:00
|
|
|
ether_addr_copy(rif->addr, dev->dev_addr);
|
|
|
|
rif->mtu = dev->mtu;
|
2017-03-10 15:53:39 +08:00
|
|
|
|
2017-03-17 16:38:00 +08:00
|
|
|
netdev_dbg(dev, "Updated RIF=%d\n", rif->rif_index);
|
2017-03-10 15:53:39 +08:00
|
|
|
|
|
|
|
return 0;
|
|
|
|
|
|
|
|
err_rif_fdb_op:
|
2017-03-17 16:38:00 +08:00
|
|
|
mlxsw_sp_rif_edit(mlxsw_sp, rif->rif_index, rif->addr, rif->mtu);
|
2017-03-10 15:53:39 +08:00
|
|
|
err_rif_edit:
|
2017-05-26 14:37:39 +08:00
|
|
|
mlxsw_sp_rif_fdb_op(mlxsw_sp, rif->addr, fid_index, true);
|
2017-03-10 15:53:39 +08:00
|
|
|
return err;
|
|
|
|
}
|
|
|
|
|
2018-12-13 19:54:52 +08:00
|
|
|
static int mlxsw_sp_router_port_pre_changeaddr_event(struct mlxsw_sp_rif *rif,
|
|
|
|
struct netdev_notifier_pre_changeaddr_info *info)
|
|
|
|
{
|
|
|
|
struct netlink_ext_ack *extack;
|
|
|
|
|
|
|
|
extack = netdev_notifier_info_to_extack(&info->info);
|
|
|
|
return mlxsw_sp_router_port_check_rif_addr(rif->mlxsw_sp, rif->dev,
|
|
|
|
info->dev_addr, extack);
|
|
|
|
}
|
|
|
|
|
2018-12-13 19:54:48 +08:00
|
|
|
int mlxsw_sp_netdevice_router_port_event(struct net_device *dev,
|
|
|
|
unsigned long event, void *ptr)
|
|
|
|
{
|
|
|
|
struct mlxsw_sp *mlxsw_sp;
|
|
|
|
struct mlxsw_sp_rif *rif;
|
2020-02-22 01:54:12 +08:00
|
|
|
int err = 0;
|
2018-12-13 19:54:48 +08:00
|
|
|
|
|
|
|
mlxsw_sp = mlxsw_sp_lower_get(dev);
|
|
|
|
if (!mlxsw_sp)
|
|
|
|
return 0;
|
|
|
|
|
2020-02-22 01:54:12 +08:00
|
|
|
mutex_lock(&mlxsw_sp->router->lock);
|
2018-12-13 19:54:48 +08:00
|
|
|
rif = mlxsw_sp_rif_find_by_dev(mlxsw_sp, dev);
|
|
|
|
if (!rif)
|
2020-02-22 01:54:12 +08:00
|
|
|
goto out;
|
2018-12-13 19:54:48 +08:00
|
|
|
|
|
|
|
switch (event) {
|
|
|
|
case NETDEV_CHANGEMTU: /* fall through */
|
|
|
|
case NETDEV_CHANGEADDR:
|
2020-02-22 01:54:12 +08:00
|
|
|
err = mlxsw_sp_router_port_change_event(mlxsw_sp, rif);
|
|
|
|
break;
|
2018-12-13 19:54:52 +08:00
|
|
|
case NETDEV_PRE_CHANGEADDR:
|
2020-02-22 01:54:12 +08:00
|
|
|
err = mlxsw_sp_router_port_pre_changeaddr_event(rif, ptr);
|
|
|
|
break;
|
2018-12-13 19:54:48 +08:00
|
|
|
}
|
|
|
|
|
2020-02-22 01:54:12 +08:00
|
|
|
out:
|
|
|
|
mutex_unlock(&mlxsw_sp->router->lock);
|
|
|
|
return err;
|
2018-12-13 19:54:48 +08:00
|
|
|
}
|
|
|
|
|
2017-05-01 00:47:14 +08:00
|
|
|
static int mlxsw_sp_port_vrf_join(struct mlxsw_sp *mlxsw_sp,
|
2017-10-19 00:56:56 +08:00
|
|
|
struct net_device *l3_dev,
|
|
|
|
struct netlink_ext_ack *extack)
|
2017-03-16 16:08:18 +08:00
|
|
|
{
|
2017-05-01 00:47:14 +08:00
|
|
|
struct mlxsw_sp_rif *rif;
|
2017-03-16 16:08:18 +08:00
|
|
|
|
2017-05-01 00:47:14 +08:00
|
|
|
/* If netdev is already associated with a RIF, then we need to
|
|
|
|
* destroy it and create a new one with the new virtual router ID.
|
2017-03-16 16:08:18 +08:00
|
|
|
*/
|
2017-05-01 00:47:14 +08:00
|
|
|
rif = mlxsw_sp_rif_find_by_dev(mlxsw_sp, l3_dev);
|
|
|
|
if (rif)
|
2018-12-19 14:08:47 +08:00
|
|
|
__mlxsw_sp_inetaddr_event(mlxsw_sp, l3_dev, NETDEV_DOWN,
|
|
|
|
extack);
|
2017-03-16 16:08:18 +08:00
|
|
|
|
2018-12-19 14:08:47 +08:00
|
|
|
return __mlxsw_sp_inetaddr_event(mlxsw_sp, l3_dev, NETDEV_UP, extack);
|
2017-03-16 16:08:18 +08:00
|
|
|
}
|
|
|
|
|
2017-05-01 00:47:14 +08:00
|
|
|
static void mlxsw_sp_port_vrf_leave(struct mlxsw_sp *mlxsw_sp,
|
|
|
|
struct net_device *l3_dev)
|
2017-03-16 16:08:18 +08:00
|
|
|
{
|
2017-05-01 00:47:14 +08:00
|
|
|
struct mlxsw_sp_rif *rif;
|
2017-03-16 16:08:18 +08:00
|
|
|
|
2017-05-01 00:47:14 +08:00
|
|
|
rif = mlxsw_sp_rif_find_by_dev(mlxsw_sp, l3_dev);
|
|
|
|
if (!rif)
|
2017-03-16 16:08:18 +08:00
|
|
|
return;
|
2018-12-19 14:08:47 +08:00
|
|
|
__mlxsw_sp_inetaddr_event(mlxsw_sp, l3_dev, NETDEV_DOWN, NULL);
|
2017-03-16 16:08:18 +08:00
|
|
|
}
|
|
|
|
|
2017-05-01 00:47:14 +08:00
|
|
|
int mlxsw_sp_netdevice_vrf_event(struct net_device *l3_dev, unsigned long event,
|
|
|
|
struct netdev_notifier_changeupper_info *info)
|
2017-03-16 16:08:19 +08:00
|
|
|
{
|
2017-05-01 00:47:14 +08:00
|
|
|
struct mlxsw_sp *mlxsw_sp = mlxsw_sp_lower_get(l3_dev);
|
|
|
|
int err = 0;
|
2017-03-16 16:08:19 +08:00
|
|
|
|
2018-07-14 16:39:51 +08:00
|
|
|
/* We do not create a RIF for a macvlan, but only use it to
|
|
|
|
* direct more MAC addresses to the router.
|
|
|
|
*/
|
|
|
|
if (!mlxsw_sp || netif_is_macvlan(l3_dev))
|
2017-05-01 00:47:14 +08:00
|
|
|
return 0;
|
2017-03-16 16:08:19 +08:00
|
|
|
|
2020-02-22 01:54:12 +08:00
|
|
|
mutex_lock(&mlxsw_sp->router->lock);
|
2017-05-01 00:47:14 +08:00
|
|
|
switch (event) {
|
|
|
|
case NETDEV_PRECHANGEUPPER:
|
2020-02-22 01:54:12 +08:00
|
|
|
break;
|
2017-05-01 00:47:14 +08:00
|
|
|
case NETDEV_CHANGEUPPER:
|
2017-10-19 00:56:56 +08:00
|
|
|
if (info->linking) {
|
|
|
|
struct netlink_ext_ack *extack;
|
|
|
|
|
|
|
|
extack = netdev_notifier_info_to_extack(&info->info);
|
|
|
|
err = mlxsw_sp_port_vrf_join(mlxsw_sp, l3_dev, extack);
|
|
|
|
} else {
|
2017-05-01 00:47:14 +08:00
|
|
|
mlxsw_sp_port_vrf_leave(mlxsw_sp, l3_dev);
|
2017-10-19 00:56:56 +08:00
|
|
|
}
|
2017-05-01 00:47:14 +08:00
|
|
|
break;
|
|
|
|
}
|
2020-02-22 01:54:12 +08:00
|
|
|
mutex_unlock(&mlxsw_sp->router->lock);
|
2017-03-16 16:08:19 +08:00
|
|
|
|
2017-05-01 00:47:14 +08:00
|
|
|
return err;
|
2017-03-16 16:08:19 +08:00
|
|
|
}
|
|
|
|
|
2018-07-14 16:39:52 +08:00
|
|
|
static int __mlxsw_sp_rif_macvlan_flush(struct net_device *dev, void *data)
|
|
|
|
{
|
|
|
|
struct mlxsw_sp_rif *rif = data;
|
|
|
|
|
|
|
|
if (!netif_is_macvlan(dev))
|
|
|
|
return 0;
|
|
|
|
|
|
|
|
return mlxsw_sp_rif_fdb_op(rif->mlxsw_sp, dev->dev_addr,
|
|
|
|
mlxsw_sp_fid_index(rif->fid), false);
|
|
|
|
}
|
|
|
|
|
|
|
|
static int mlxsw_sp_rif_macvlan_flush(struct mlxsw_sp_rif *rif)
|
|
|
|
{
|
|
|
|
if (!netif_is_macvlan_port(rif->dev))
|
|
|
|
return 0;
|
|
|
|
|
|
|
|
netdev_warn(rif->dev, "Router interface is deleted. Upper macvlans will not work\n");
|
|
|
|
return netdev_walk_all_upper_dev_rcu(rif->dev,
|
|
|
|
__mlxsw_sp_rif_macvlan_flush, rif);
|
|
|
|
}
|
|
|
|
|
2017-05-26 14:37:40 +08:00
|
|
|
static void mlxsw_sp_rif_subport_setup(struct mlxsw_sp_rif *rif,
|
|
|
|
const struct mlxsw_sp_rif_params *params)
|
|
|
|
{
|
|
|
|
struct mlxsw_sp_rif_subport *rif_subport;
|
|
|
|
|
|
|
|
rif_subport = mlxsw_sp_rif_subport_rif(rif);
|
mlxsw: spectrum_router: Do not destroy RIFs based on FID's reference count
Currently, when a RIF is constructed on top of a FID, the RIF increments
the FID's reference count and the RIF is destroyed when the FID's
reference count drops to 1. This effectively means that when no local
ports are member in the FID, the FID is destroyed regardless if the
router port is a member in the FID or not.
The above can lead to the unexpected behavior in which routes using a
VLAN interface as their nexthop device are no longer offloaded after the
last local port leaves the corresponding VLAN (FID).
Example:
# ip -4 route show dev br0.10
192.0.2.0/24 proto kernel scope link src 192.0.2.1 offload
# bridge vlan del vid 10 dev swp3
# ip -4 route show dev br0.10
192.0.2.0/24 proto kernel scope link src 192.0.2.1
After the patch, the route is offloaded before and after the VLAN is
removed from local port 'swp3', as the RIF corresponding to 'br0.10'
continues to exists.
In order to remove RIFs' reliance on the underlying FID's reference
count, we need to add a reference count to sub-port RIFs, which are RIFs
that correspond to physical ports and their uppers (e.g., LAG devices).
In this case, each {Port, VID} ('struct mlxsw_sp_port_vlan') needs to
hold a reference on the RIF. For example:
bond0.10
|
bond0
|
+-------+
| |
swp1 swp2
Both {Port 1, VID 10} and {Port 2, VID 10} will hold a reference on the
RIF corresponding to 'bond0.10'. When the last reference is dropped, the
RIF will be destroyed.
Signed-off-by: Ido Schimmel <idosch@mellanox.com>
Reviewed-by: Petr Machata <petrm@mellanox.com>
Signed-off-by: David S. Miller <davem@davemloft.net>
2018-12-19 14:08:38 +08:00
|
|
|
refcount_set(&rif_subport->ref_count, 1);
|
2017-05-26 14:37:40 +08:00
|
|
|
rif_subport->vid = params->vid;
|
|
|
|
rif_subport->lag = params->lag;
|
|
|
|
if (params->lag)
|
|
|
|
rif_subport->lag_id = params->lag_id;
|
2017-05-26 14:37:39 +08:00
|
|
|
else
|
2017-05-26 14:37:40 +08:00
|
|
|
rif_subport->system_port = params->system_port;
|
|
|
|
}
|
|
|
|
|
|
|
|
/* Write the RITR record of a sub-port RIF.
 *
 * @enable is passed to mlxsw_reg_ritr_pack(). The record carries the
 * netdev's current MTU and MAC, plus the LAG ID or system port and the VID
 * stored in the sub-port RIF. Returns the result of the register write.
 */
static int mlxsw_sp_rif_subport_op(struct mlxsw_sp_rif *rif, bool enable)
{
	struct mlxsw_sp_rif_subport *subport = mlxsw_sp_rif_subport_rif(rif);
	struct net_device *netdev = rif->dev;
	char payload[MLXSW_REG_RITR_LEN];

	mlxsw_reg_ritr_pack(payload, enable, MLXSW_REG_RITR_SP_IF,
			    rif->rif_index, rif->vr_id, netdev->mtu);
	mlxsw_reg_ritr_mac_pack(payload, netdev->dev_addr);
	mlxsw_reg_ritr_sp_if_pack(payload, subport->lag,
				  subport->lag ? subport->lag_id :
						 subport->system_port,
				  subport->vid);

	return mlxsw_reg_write(rif->mlxsw_sp->core, MLXSW_REG(ritr), payload);
}
|
|
|
|
|
|
|
|
static int mlxsw_sp_rif_subport_configure(struct mlxsw_sp_rif *rif)
|
|
|
|
{
|
2017-09-03 05:49:18 +08:00
|
|
|
int err;
|
|
|
|
|
|
|
|
err = mlxsw_sp_rif_subport_op(rif, true);
|
|
|
|
if (err)
|
|
|
|
return err;
|
|
|
|
|
|
|
|
err = mlxsw_sp_rif_fdb_op(rif->mlxsw_sp, rif->dev->dev_addr,
|
|
|
|
mlxsw_sp_fid_index(rif->fid), true);
|
|
|
|
if (err)
|
|
|
|
goto err_rif_fdb_op;
|
|
|
|
|
|
|
|
mlxsw_sp_fid_rif_set(rif->fid, rif);
|
|
|
|
return 0;
|
|
|
|
|
|
|
|
err_rif_fdb_op:
|
|
|
|
mlxsw_sp_rif_subport_op(rif, false);
|
|
|
|
return err;
|
2017-05-26 14:37:39 +08:00
|
|
|
}
|
|
|
|
|
2017-05-26 14:37:40 +08:00
|
|
|
static void mlxsw_sp_rif_subport_deconfigure(struct mlxsw_sp_rif *rif)
|
|
|
|
{
|
2017-09-03 05:49:18 +08:00
|
|
|
struct mlxsw_sp_fid *fid = rif->fid;
|
|
|
|
|
|
|
|
mlxsw_sp_fid_rif_set(fid, NULL);
|
|
|
|
mlxsw_sp_rif_fdb_op(rif->mlxsw_sp, rif->dev->dev_addr,
|
|
|
|
mlxsw_sp_fid_index(fid), false);
|
2018-07-14 16:39:52 +08:00
|
|
|
mlxsw_sp_rif_macvlan_flush(rif);
|
2017-05-26 14:37:40 +08:00
|
|
|
mlxsw_sp_rif_subport_op(rif, false);
|
|
|
|
}
|
|
|
|
|
|
|
|
static struct mlxsw_sp_fid *
|
2018-06-25 15:48:13 +08:00
|
|
|
mlxsw_sp_rif_subport_fid_get(struct mlxsw_sp_rif *rif,
|
|
|
|
struct netlink_ext_ack *extack)
|
2017-05-26 14:37:40 +08:00
|
|
|
{
|
|
|
|
return mlxsw_sp_fid_rfid_get(rif->mlxsw_sp, rif->rif_index);
|
|
|
|
}
|
|
|
|
|
|
|
|
static const struct mlxsw_sp_rif_ops mlxsw_sp_rif_subport_ops = {
|
|
|
|
.type = MLXSW_SP_RIF_TYPE_SUBPORT,
|
|
|
|
.rif_size = sizeof(struct mlxsw_sp_rif_subport),
|
|
|
|
.setup = mlxsw_sp_rif_subport_setup,
|
|
|
|
.configure = mlxsw_sp_rif_subport_configure,
|
|
|
|
.deconfigure = mlxsw_sp_rif_subport_deconfigure,
|
|
|
|
.fid_get = mlxsw_sp_rif_subport_fid_get,
|
|
|
|
};
|
|
|
|
|
|
|
|
static int mlxsw_sp_rif_vlan_fid_op(struct mlxsw_sp_rif *rif,
|
|
|
|
enum mlxsw_reg_ritr_if_type type,
|
|
|
|
u16 vid_fid, bool enable)
|
|
|
|
{
|
|
|
|
struct mlxsw_sp *mlxsw_sp = rif->mlxsw_sp;
|
|
|
|
char ritr_pl[MLXSW_REG_RITR_LEN];
|
|
|
|
|
|
|
|
mlxsw_reg_ritr_pack(ritr_pl, enable, type, rif->rif_index, rif->vr_id,
|
2017-09-03 05:49:14 +08:00
|
|
|
rif->dev->mtu);
|
|
|
|
mlxsw_reg_ritr_mac_pack(ritr_pl, rif->dev->dev_addr);
|
2017-05-26 14:37:40 +08:00
|
|
|
mlxsw_reg_ritr_fid_set(ritr_pl, type, vid_fid);
|
|
|
|
|
|
|
|
return mlxsw_reg_write(mlxsw_sp->core, MLXSW_REG(ritr), ritr_pl);
|
|
|
|
}
|
|
|
|
|
2017-10-09 17:15:33 +08:00
|
|
|
u8 mlxsw_sp_router_port(const struct mlxsw_sp *mlxsw_sp)
|
2017-05-26 14:37:40 +08:00
|
|
|
{
|
|
|
|
return mlxsw_core_max_ports(mlxsw_sp->core) + 1;
|
|
|
|
}
|
|
|
|
|
|
|
|
static int mlxsw_sp_rif_vlan_configure(struct mlxsw_sp_rif *rif)
|
|
|
|
{
|
|
|
|
struct mlxsw_sp *mlxsw_sp = rif->mlxsw_sp;
|
|
|
|
u16 vid = mlxsw_sp_fid_8021q_vid(rif->fid);
|
|
|
|
int err;
|
|
|
|
|
|
|
|
err = mlxsw_sp_rif_vlan_fid_op(rif, MLXSW_REG_RITR_VLAN_IF, vid, true);
|
|
|
|
if (err)
|
|
|
|
return err;
|
|
|
|
|
2017-07-18 16:10:12 +08:00
|
|
|
err = mlxsw_sp_fid_flood_set(rif->fid, MLXSW_SP_FLOOD_TYPE_MC,
|
|
|
|
mlxsw_sp_router_port(mlxsw_sp), true);
|
|
|
|
if (err)
|
|
|
|
goto err_fid_mc_flood_set;
|
|
|
|
|
2017-05-26 14:37:40 +08:00
|
|
|
err = mlxsw_sp_fid_flood_set(rif->fid, MLXSW_SP_FLOOD_TYPE_BC,
|
|
|
|
mlxsw_sp_router_port(mlxsw_sp), true);
|
|
|
|
if (err)
|
|
|
|
goto err_fid_bc_flood_set;
|
|
|
|
|
2017-09-03 05:49:18 +08:00
|
|
|
err = mlxsw_sp_rif_fdb_op(rif->mlxsw_sp, rif->dev->dev_addr,
|
|
|
|
mlxsw_sp_fid_index(rif->fid), true);
|
|
|
|
if (err)
|
|
|
|
goto err_rif_fdb_op;
|
|
|
|
|
|
|
|
mlxsw_sp_fid_rif_set(rif->fid, rif);
|
2017-05-26 14:37:40 +08:00
|
|
|
return 0;
|
|
|
|
|
2017-09-03 05:49:18 +08:00
|
|
|
err_rif_fdb_op:
|
|
|
|
mlxsw_sp_fid_flood_set(rif->fid, MLXSW_SP_FLOOD_TYPE_BC,
|
|
|
|
mlxsw_sp_router_port(mlxsw_sp), false);
|
2017-05-26 14:37:40 +08:00
|
|
|
err_fid_bc_flood_set:
|
2017-07-18 16:10:12 +08:00
|
|
|
mlxsw_sp_fid_flood_set(rif->fid, MLXSW_SP_FLOOD_TYPE_MC,
|
|
|
|
mlxsw_sp_router_port(mlxsw_sp), false);
|
|
|
|
err_fid_mc_flood_set:
|
2017-05-26 14:37:40 +08:00
|
|
|
mlxsw_sp_rif_vlan_fid_op(rif, MLXSW_REG_RITR_VLAN_IF, vid, false);
|
|
|
|
return err;
|
|
|
|
}
|
|
|
|
|
|
|
|
static void mlxsw_sp_rif_vlan_deconfigure(struct mlxsw_sp_rif *rif)
|
|
|
|
{
|
|
|
|
u16 vid = mlxsw_sp_fid_8021q_vid(rif->fid);
|
2017-09-03 05:49:18 +08:00
|
|
|
struct mlxsw_sp *mlxsw_sp = rif->mlxsw_sp;
|
|
|
|
struct mlxsw_sp_fid *fid = rif->fid;
|
2017-05-26 14:37:40 +08:00
|
|
|
|
2017-09-03 05:49:18 +08:00
|
|
|
mlxsw_sp_fid_rif_set(fid, NULL);
|
|
|
|
mlxsw_sp_rif_fdb_op(rif->mlxsw_sp, rif->dev->dev_addr,
|
|
|
|
mlxsw_sp_fid_index(fid), false);
|
2018-07-14 16:39:52 +08:00
|
|
|
mlxsw_sp_rif_macvlan_flush(rif);
|
2017-05-26 14:37:40 +08:00
|
|
|
mlxsw_sp_fid_flood_set(rif->fid, MLXSW_SP_FLOOD_TYPE_BC,
|
|
|
|
mlxsw_sp_router_port(mlxsw_sp), false);
|
2017-07-18 16:10:12 +08:00
|
|
|
mlxsw_sp_fid_flood_set(rif->fid, MLXSW_SP_FLOOD_TYPE_MC,
|
|
|
|
mlxsw_sp_router_port(mlxsw_sp), false);
|
2017-05-26 14:37:40 +08:00
|
|
|
mlxsw_sp_rif_vlan_fid_op(rif, MLXSW_REG_RITR_VLAN_IF, vid, false);
|
|
|
|
}
|
|
|
|
|
|
|
|
static struct mlxsw_sp_fid *
|
2018-06-25 15:48:13 +08:00
|
|
|
mlxsw_sp_rif_vlan_fid_get(struct mlxsw_sp_rif *rif,
|
|
|
|
struct netlink_ext_ack *extack)
|
2017-05-26 14:37:40 +08:00
|
|
|
{
|
2018-12-21 03:42:23 +08:00
|
|
|
struct net_device *br_dev = rif->dev;
|
2018-06-25 15:48:14 +08:00
|
|
|
u16 vid;
|
|
|
|
int err;
|
|
|
|
|
|
|
|
if (is_vlan_dev(rif->dev)) {
|
|
|
|
vid = vlan_dev_vlan_id(rif->dev);
|
2018-12-21 03:42:23 +08:00
|
|
|
br_dev = vlan_dev_real_dev(rif->dev);
|
|
|
|
if (WARN_ON(!netif_is_bridge_master(br_dev)))
|
|
|
|
return ERR_PTR(-EINVAL);
|
2018-06-25 15:48:14 +08:00
|
|
|
} else {
|
|
|
|
err = br_vlan_get_pvid(rif->dev, &vid);
|
2018-07-06 20:44:45 +08:00
|
|
|
if (err < 0 || !vid) {
|
2018-06-25 15:48:14 +08:00
|
|
|
NL_SET_ERR_MSG_MOD(extack, "Couldn't determine bridge PVID");
|
2018-07-06 20:44:45 +08:00
|
|
|
return ERR_PTR(-EINVAL);
|
2018-06-25 15:48:14 +08:00
|
|
|
}
|
|
|
|
}
|
2017-05-26 14:37:40 +08:00
|
|
|
|
2020-02-17 22:29:35 +08:00
|
|
|
return mlxsw_sp_fid_8021q_get(rif->mlxsw_sp, vid);
|
2017-05-26 14:37:40 +08:00
|
|
|
}
|
|
|
|
|
2018-07-14 16:39:52 +08:00
|
|
|
static void mlxsw_sp_rif_vlan_fdb_del(struct mlxsw_sp_rif *rif, const char *mac)
|
|
|
|
{
|
|
|
|
u16 vid = mlxsw_sp_fid_8021q_vid(rif->fid);
|
|
|
|
struct switchdev_notifier_fdb_info info;
|
|
|
|
struct net_device *br_dev;
|
|
|
|
struct net_device *dev;
|
|
|
|
|
|
|
|
br_dev = is_vlan_dev(rif->dev) ? vlan_dev_real_dev(rif->dev) : rif->dev;
|
|
|
|
dev = br_fdb_find_port(br_dev, mac, vid);
|
|
|
|
if (!dev)
|
|
|
|
return;
|
|
|
|
|
|
|
|
info.addr = mac;
|
|
|
|
info.vid = vid;
|
2019-01-17 07:06:56 +08:00
|
|
|
call_switchdev_notifiers(SWITCHDEV_FDB_DEL_TO_BRIDGE, dev, &info.info,
|
|
|
|
NULL);
|
2018-07-14 16:39:52 +08:00
|
|
|
}
|
|
|
|
|
2017-05-26 14:37:40 +08:00
|
|
|
static const struct mlxsw_sp_rif_ops mlxsw_sp_rif_vlan_ops = {
|
|
|
|
.type = MLXSW_SP_RIF_TYPE_VLAN,
|
|
|
|
.rif_size = sizeof(struct mlxsw_sp_rif),
|
|
|
|
.configure = mlxsw_sp_rif_vlan_configure,
|
|
|
|
.deconfigure = mlxsw_sp_rif_vlan_deconfigure,
|
|
|
|
.fid_get = mlxsw_sp_rif_vlan_fid_get,
|
2018-07-14 16:39:52 +08:00
|
|
|
.fdb_del = mlxsw_sp_rif_vlan_fdb_del,
|
2017-05-26 14:37:40 +08:00
|
|
|
};
|
|
|
|
|
|
|
|
static int mlxsw_sp_rif_fid_configure(struct mlxsw_sp_rif *rif)
|
|
|
|
{
|
|
|
|
struct mlxsw_sp *mlxsw_sp = rif->mlxsw_sp;
|
|
|
|
u16 fid_index = mlxsw_sp_fid_index(rif->fid);
|
|
|
|
int err;
|
|
|
|
|
|
|
|
err = mlxsw_sp_rif_vlan_fid_op(rif, MLXSW_REG_RITR_FID_IF, fid_index,
|
|
|
|
true);
|
|
|
|
if (err)
|
|
|
|
return err;
|
|
|
|
|
2017-07-18 16:10:12 +08:00
|
|
|
err = mlxsw_sp_fid_flood_set(rif->fid, MLXSW_SP_FLOOD_TYPE_MC,
|
|
|
|
mlxsw_sp_router_port(mlxsw_sp), true);
|
|
|
|
if (err)
|
|
|
|
goto err_fid_mc_flood_set;
|
|
|
|
|
2017-05-26 14:37:40 +08:00
|
|
|
err = mlxsw_sp_fid_flood_set(rif->fid, MLXSW_SP_FLOOD_TYPE_BC,
|
|
|
|
mlxsw_sp_router_port(mlxsw_sp), true);
|
|
|
|
if (err)
|
|
|
|
goto err_fid_bc_flood_set;
|
|
|
|
|
2017-09-03 05:49:18 +08:00
|
|
|
err = mlxsw_sp_rif_fdb_op(rif->mlxsw_sp, rif->dev->dev_addr,
|
|
|
|
mlxsw_sp_fid_index(rif->fid), true);
|
|
|
|
if (err)
|
|
|
|
goto err_rif_fdb_op;
|
|
|
|
|
|
|
|
mlxsw_sp_fid_rif_set(rif->fid, rif);
|
2017-05-26 14:37:40 +08:00
|
|
|
return 0;
|
|
|
|
|
2017-09-03 05:49:18 +08:00
|
|
|
err_rif_fdb_op:
|
|
|
|
mlxsw_sp_fid_flood_set(rif->fid, MLXSW_SP_FLOOD_TYPE_BC,
|
|
|
|
mlxsw_sp_router_port(mlxsw_sp), false);
|
2017-05-26 14:37:40 +08:00
|
|
|
err_fid_bc_flood_set:
|
2017-07-18 16:10:12 +08:00
|
|
|
mlxsw_sp_fid_flood_set(rif->fid, MLXSW_SP_FLOOD_TYPE_MC,
|
|
|
|
mlxsw_sp_router_port(mlxsw_sp), false);
|
|
|
|
err_fid_mc_flood_set:
|
2017-05-26 14:37:40 +08:00
|
|
|
mlxsw_sp_rif_vlan_fid_op(rif, MLXSW_REG_RITR_FID_IF, fid_index, false);
|
|
|
|
return err;
|
|
|
|
}
|
|
|
|
|
|
|
|
static void mlxsw_sp_rif_fid_deconfigure(struct mlxsw_sp_rif *rif)
|
|
|
|
{
|
|
|
|
u16 fid_index = mlxsw_sp_fid_index(rif->fid);
|
2017-09-03 05:49:18 +08:00
|
|
|
struct mlxsw_sp *mlxsw_sp = rif->mlxsw_sp;
|
|
|
|
struct mlxsw_sp_fid *fid = rif->fid;
|
2017-05-26 14:37:40 +08:00
|
|
|
|
2017-09-03 05:49:18 +08:00
|
|
|
mlxsw_sp_fid_rif_set(fid, NULL);
|
|
|
|
mlxsw_sp_rif_fdb_op(rif->mlxsw_sp, rif->dev->dev_addr,
|
|
|
|
mlxsw_sp_fid_index(fid), false);
|
2018-07-14 16:39:52 +08:00
|
|
|
mlxsw_sp_rif_macvlan_flush(rif);
|
2017-05-26 14:37:40 +08:00
|
|
|
mlxsw_sp_fid_flood_set(rif->fid, MLXSW_SP_FLOOD_TYPE_BC,
|
|
|
|
mlxsw_sp_router_port(mlxsw_sp), false);
|
2017-07-18 16:10:12 +08:00
|
|
|
mlxsw_sp_fid_flood_set(rif->fid, MLXSW_SP_FLOOD_TYPE_MC,
|
|
|
|
mlxsw_sp_router_port(mlxsw_sp), false);
|
2017-05-26 14:37:40 +08:00
|
|
|
mlxsw_sp_rif_vlan_fid_op(rif, MLXSW_REG_RITR_FID_IF, fid_index, false);
|
|
|
|
}
|
|
|
|
|
|
|
|
static struct mlxsw_sp_fid *
|
2018-06-25 15:48:13 +08:00
|
|
|
mlxsw_sp_rif_fid_fid_get(struct mlxsw_sp_rif *rif,
|
|
|
|
struct netlink_ext_ack *extack)
|
2017-05-26 14:37:40 +08:00
|
|
|
{
|
2020-02-17 22:29:35 +08:00
|
|
|
return mlxsw_sp_fid_8021d_get(rif->mlxsw_sp, rif->dev->ifindex);
|
2017-05-26 14:37:40 +08:00
|
|
|
}
|
|
|
|
|
2018-07-14 16:39:52 +08:00
|
|
|
static void mlxsw_sp_rif_fid_fdb_del(struct mlxsw_sp_rif *rif, const char *mac)
|
|
|
|
{
|
|
|
|
struct switchdev_notifier_fdb_info info;
|
|
|
|
struct net_device *dev;
|
|
|
|
|
|
|
|
dev = br_fdb_find_port(rif->dev, mac, 0);
|
|
|
|
if (!dev)
|
|
|
|
return;
|
|
|
|
|
|
|
|
info.addr = mac;
|
|
|
|
info.vid = 0;
|
2019-01-17 07:06:56 +08:00
|
|
|
call_switchdev_notifiers(SWITCHDEV_FDB_DEL_TO_BRIDGE, dev, &info.info,
|
|
|
|
NULL);
|
2018-07-14 16:39:52 +08:00
|
|
|
}
|
|
|
|
|
2017-05-26 14:37:40 +08:00
|
|
|
static const struct mlxsw_sp_rif_ops mlxsw_sp_rif_fid_ops = {
|
|
|
|
.type = MLXSW_SP_RIF_TYPE_FID,
|
|
|
|
.rif_size = sizeof(struct mlxsw_sp_rif),
|
|
|
|
.configure = mlxsw_sp_rif_fid_configure,
|
|
|
|
.deconfigure = mlxsw_sp_rif_fid_deconfigure,
|
|
|
|
.fid_get = mlxsw_sp_rif_fid_fid_get,
|
2018-07-14 16:39:52 +08:00
|
|
|
.fdb_del = mlxsw_sp_rif_fid_fdb_del,
|
2017-05-26 14:37:40 +08:00
|
|
|
};
|
|
|
|
|
2018-11-25 17:43:58 +08:00
|
|
|
static const struct mlxsw_sp_rif_ops mlxsw_sp_rif_vlan_emu_ops = {
|
|
|
|
.type = MLXSW_SP_RIF_TYPE_VLAN,
|
|
|
|
.rif_size = sizeof(struct mlxsw_sp_rif),
|
|
|
|
.configure = mlxsw_sp_rif_fid_configure,
|
|
|
|
.deconfigure = mlxsw_sp_rif_fid_deconfigure,
|
|
|
|
.fid_get = mlxsw_sp_rif_vlan_fid_get,
|
|
|
|
.fdb_del = mlxsw_sp_rif_vlan_fdb_del,
|
|
|
|
};
|
|
|
|
|
2017-09-03 05:49:19 +08:00
|
|
|
static struct mlxsw_sp_rif_ipip_lb *
|
|
|
|
mlxsw_sp_rif_ipip_lb_rif(struct mlxsw_sp_rif *rif)
|
|
|
|
{
|
|
|
|
return container_of(rif, struct mlxsw_sp_rif_ipip_lb, common);
|
|
|
|
}
|
|
|
|
|
|
|
|
static void
|
|
|
|
mlxsw_sp_rif_ipip_lb_setup(struct mlxsw_sp_rif *rif,
|
|
|
|
const struct mlxsw_sp_rif_params *params)
|
|
|
|
{
|
|
|
|
struct mlxsw_sp_rif_params_ipip_lb *params_lb;
|
|
|
|
struct mlxsw_sp_rif_ipip_lb *rif_lb;
|
|
|
|
|
|
|
|
params_lb = container_of(params, struct mlxsw_sp_rif_params_ipip_lb,
|
|
|
|
common);
|
|
|
|
rif_lb = mlxsw_sp_rif_ipip_lb_rif(rif);
|
|
|
|
rif_lb->lb_config = params_lb->lb_config;
|
|
|
|
}
|
|
|
|
|
|
|
|
static int
|
2019-01-20 14:50:40 +08:00
|
|
|
mlxsw_sp1_rif_ipip_lb_configure(struct mlxsw_sp_rif *rif)
|
2017-09-03 05:49:19 +08:00
|
|
|
{
|
|
|
|
struct mlxsw_sp_rif_ipip_lb *lb_rif = mlxsw_sp_rif_ipip_lb_rif(rif);
|
|
|
|
u32 ul_tb_id = mlxsw_sp_ipip_dev_ul_tb_id(rif->dev);
|
|
|
|
struct mlxsw_sp *mlxsw_sp = rif->mlxsw_sp;
|
|
|
|
struct mlxsw_sp_vr *ul_vr;
|
|
|
|
int err;
|
|
|
|
|
2017-10-19 00:56:56 +08:00
|
|
|
ul_vr = mlxsw_sp_vr_get(mlxsw_sp, ul_tb_id, NULL);
|
2017-09-03 05:49:19 +08:00
|
|
|
if (IS_ERR(ul_vr))
|
|
|
|
return PTR_ERR(ul_vr);
|
|
|
|
|
2019-01-20 14:50:42 +08:00
|
|
|
err = mlxsw_sp_rif_ipip_lb_op(lb_rif, ul_vr->id, 0, true);
|
2017-09-03 05:49:19 +08:00
|
|
|
if (err)
|
|
|
|
goto err_loopback_op;
|
|
|
|
|
|
|
|
lb_rif->ul_vr_id = ul_vr->id;
|
2019-01-20 14:50:47 +08:00
|
|
|
lb_rif->ul_rif_id = 0;
|
2017-09-03 05:49:19 +08:00
|
|
|
++ul_vr->rif_count;
|
|
|
|
return 0;
|
|
|
|
|
|
|
|
err_loopback_op:
|
2018-01-22 16:17:42 +08:00
|
|
|
mlxsw_sp_vr_put(mlxsw_sp, ul_vr);
|
2017-09-03 05:49:19 +08:00
|
|
|
return err;
|
|
|
|
}
|
|
|
|
|
2019-01-20 14:50:40 +08:00
|
|
|
static void mlxsw_sp1_rif_ipip_lb_deconfigure(struct mlxsw_sp_rif *rif)
|
2017-09-03 05:49:19 +08:00
|
|
|
{
|
|
|
|
struct mlxsw_sp_rif_ipip_lb *lb_rif = mlxsw_sp_rif_ipip_lb_rif(rif);
|
|
|
|
struct mlxsw_sp *mlxsw_sp = rif->mlxsw_sp;
|
|
|
|
struct mlxsw_sp_vr *ul_vr;
|
|
|
|
|
|
|
|
ul_vr = &mlxsw_sp->router->vrs[lb_rif->ul_vr_id];
|
2019-01-20 14:50:42 +08:00
|
|
|
mlxsw_sp_rif_ipip_lb_op(lb_rif, ul_vr->id, 0, false);
|
2017-09-03 05:49:19 +08:00
|
|
|
|
|
|
|
--ul_vr->rif_count;
|
2018-01-22 16:17:42 +08:00
|
|
|
mlxsw_sp_vr_put(mlxsw_sp, ul_vr);
|
2017-09-03 05:49:19 +08:00
|
|
|
}
|
|
|
|
|
2019-01-20 14:50:40 +08:00
|
|
|
static const struct mlxsw_sp_rif_ops mlxsw_sp1_rif_ipip_lb_ops = {
|
2017-09-03 05:49:19 +08:00
|
|
|
.type = MLXSW_SP_RIF_TYPE_IPIP_LB,
|
|
|
|
.rif_size = sizeof(struct mlxsw_sp_rif_ipip_lb),
|
|
|
|
.setup = mlxsw_sp_rif_ipip_lb_setup,
|
2019-01-20 14:50:40 +08:00
|
|
|
.configure = mlxsw_sp1_rif_ipip_lb_configure,
|
|
|
|
.deconfigure = mlxsw_sp1_rif_ipip_lb_deconfigure,
|
2017-09-03 05:49:19 +08:00
|
|
|
};
|
|
|
|
|
2019-01-20 14:50:40 +08:00
|
|
|
const struct mlxsw_sp_rif_ops *mlxsw_sp1_rif_ops_arr[] = {
|
2017-05-26 14:37:40 +08:00
|
|
|
[MLXSW_SP_RIF_TYPE_SUBPORT] = &mlxsw_sp_rif_subport_ops,
|
2018-11-25 17:43:59 +08:00
|
|
|
[MLXSW_SP_RIF_TYPE_VLAN] = &mlxsw_sp_rif_vlan_emu_ops,
|
2017-05-26 14:37:40 +08:00
|
|
|
[MLXSW_SP_RIF_TYPE_FID] = &mlxsw_sp_rif_fid_ops,
|
2019-01-20 14:50:40 +08:00
|
|
|
[MLXSW_SP_RIF_TYPE_IPIP_LB] = &mlxsw_sp1_rif_ipip_lb_ops,
|
|
|
|
};
|
|
|
|
|
2019-01-20 14:50:51 +08:00
|
|
|
static int
|
|
|
|
mlxsw_sp_rif_ipip_lb_ul_rif_op(struct mlxsw_sp_rif *ul_rif, bool enable)
|
|
|
|
{
|
|
|
|
struct mlxsw_sp *mlxsw_sp = ul_rif->mlxsw_sp;
|
|
|
|
char ritr_pl[MLXSW_REG_RITR_LEN];
|
|
|
|
|
|
|
|
mlxsw_reg_ritr_pack(ritr_pl, enable, MLXSW_REG_RITR_LOOPBACK_IF,
|
|
|
|
ul_rif->rif_index, ul_rif->vr_id, IP_MAX_MTU);
|
|
|
|
mlxsw_reg_ritr_loopback_protocol_set(ritr_pl,
|
|
|
|
MLXSW_REG_RITR_LOOPBACK_GENERIC);
|
|
|
|
|
|
|
|
return mlxsw_reg_write(mlxsw_sp->core, MLXSW_REG(ritr), ritr_pl);
|
|
|
|
}
|
|
|
|
|
|
|
|
static struct mlxsw_sp_rif *
|
|
|
|
mlxsw_sp_ul_rif_create(struct mlxsw_sp *mlxsw_sp, struct mlxsw_sp_vr *vr,
|
|
|
|
struct netlink_ext_ack *extack)
|
|
|
|
{
|
|
|
|
struct mlxsw_sp_rif *ul_rif;
|
|
|
|
u16 rif_index;
|
|
|
|
int err;
|
|
|
|
|
|
|
|
err = mlxsw_sp_rif_index_alloc(mlxsw_sp, &rif_index);
|
|
|
|
if (err) {
|
|
|
|
NL_SET_ERR_MSG_MOD(extack, "Exceeded number of supported router interfaces");
|
|
|
|
return ERR_PTR(err);
|
|
|
|
}
|
|
|
|
|
|
|
|
ul_rif = mlxsw_sp_rif_alloc(sizeof(*ul_rif), rif_index, vr->id, NULL);
|
|
|
|
if (!ul_rif)
|
|
|
|
return ERR_PTR(-ENOMEM);
|
|
|
|
|
|
|
|
mlxsw_sp->router->rifs[rif_index] = ul_rif;
|
|
|
|
ul_rif->mlxsw_sp = mlxsw_sp;
|
|
|
|
err = mlxsw_sp_rif_ipip_lb_ul_rif_op(ul_rif, true);
|
|
|
|
if (err)
|
|
|
|
goto ul_rif_op_err;
|
|
|
|
|
|
|
|
return ul_rif;
|
|
|
|
|
|
|
|
ul_rif_op_err:
|
|
|
|
mlxsw_sp->router->rifs[rif_index] = NULL;
|
|
|
|
kfree(ul_rif);
|
|
|
|
return ERR_PTR(err);
|
|
|
|
}
|
|
|
|
|
|
|
|
static void mlxsw_sp_ul_rif_destroy(struct mlxsw_sp_rif *ul_rif)
|
|
|
|
{
|
|
|
|
struct mlxsw_sp *mlxsw_sp = ul_rif->mlxsw_sp;
|
|
|
|
|
|
|
|
mlxsw_sp_rif_ipip_lb_ul_rif_op(ul_rif, false);
|
|
|
|
mlxsw_sp->router->rifs[ul_rif->rif_index] = NULL;
|
|
|
|
kfree(ul_rif);
|
|
|
|
}
|
|
|
|
|
|
|
|
static struct mlxsw_sp_rif *
|
|
|
|
mlxsw_sp_ul_rif_get(struct mlxsw_sp *mlxsw_sp, u32 tb_id,
|
|
|
|
struct netlink_ext_ack *extack)
|
|
|
|
{
|
|
|
|
struct mlxsw_sp_vr *vr;
|
|
|
|
int err;
|
|
|
|
|
|
|
|
vr = mlxsw_sp_vr_get(mlxsw_sp, tb_id, extack);
|
|
|
|
if (IS_ERR(vr))
|
|
|
|
return ERR_CAST(vr);
|
|
|
|
|
|
|
|
if (refcount_inc_not_zero(&vr->ul_rif_refcnt))
|
|
|
|
return vr->ul_rif;
|
|
|
|
|
|
|
|
vr->ul_rif = mlxsw_sp_ul_rif_create(mlxsw_sp, vr, extack);
|
|
|
|
if (IS_ERR(vr->ul_rif)) {
|
|
|
|
err = PTR_ERR(vr->ul_rif);
|
|
|
|
goto err_ul_rif_create;
|
|
|
|
}
|
|
|
|
|
|
|
|
vr->rif_count++;
|
|
|
|
refcount_set(&vr->ul_rif_refcnt, 1);
|
|
|
|
|
|
|
|
return vr->ul_rif;
|
|
|
|
|
|
|
|
err_ul_rif_create:
|
|
|
|
mlxsw_sp_vr_put(mlxsw_sp, vr);
|
|
|
|
return ERR_PTR(err);
|
|
|
|
}
|
|
|
|
|
|
|
|
static void mlxsw_sp_ul_rif_put(struct mlxsw_sp_rif *ul_rif)
|
|
|
|
{
|
|
|
|
struct mlxsw_sp *mlxsw_sp = ul_rif->mlxsw_sp;
|
|
|
|
struct mlxsw_sp_vr *vr;
|
|
|
|
|
|
|
|
vr = &mlxsw_sp->router->vrs[ul_rif->vr_id];
|
|
|
|
|
|
|
|
if (!refcount_dec_and_test(&vr->ul_rif_refcnt))
|
|
|
|
return;
|
|
|
|
|
|
|
|
vr->rif_count--;
|
|
|
|
mlxsw_sp_ul_rif_destroy(ul_rif);
|
|
|
|
mlxsw_sp_vr_put(mlxsw_sp, vr);
|
|
|
|
}
|
|
|
|
|
2019-01-23 22:32:55 +08:00
|
|
|
int mlxsw_sp_router_ul_rif_get(struct mlxsw_sp *mlxsw_sp, u32 ul_tb_id,
|
|
|
|
u16 *ul_rif_index)
|
|
|
|
{
|
|
|
|
struct mlxsw_sp_rif *ul_rif;
|
|
|
|
|
|
|
|
ASSERT_RTNL();
|
|
|
|
|
|
|
|
ul_rif = mlxsw_sp_ul_rif_get(mlxsw_sp, ul_tb_id, NULL);
|
|
|
|
if (IS_ERR(ul_rif))
|
|
|
|
return PTR_ERR(ul_rif);
|
|
|
|
*ul_rif_index = ul_rif->rif_index;
|
|
|
|
|
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
|
|
|
/* Drop a reference on the underlay RIF stored at @ul_rif_index. Asserts that
 * RTNL is held; warns and returns if no RIF is registered at that index.
 */
void mlxsw_sp_router_ul_rif_put(struct mlxsw_sp *mlxsw_sp, u16 ul_rif_index)
{
	struct mlxsw_sp_rif *underlay_rif;

	ASSERT_RTNL();

	underlay_rif = mlxsw_sp->router->rifs[ul_rif_index];
	if (!WARN_ON(!underlay_rif))
		mlxsw_sp_ul_rif_put(underlay_rif);
}
|
|
|
|
|
2019-01-20 14:50:40 +08:00
|
|
|
static int
|
|
|
|
mlxsw_sp2_rif_ipip_lb_configure(struct mlxsw_sp_rif *rif)
|
|
|
|
{
|
2019-01-20 14:50:51 +08:00
|
|
|
struct mlxsw_sp_rif_ipip_lb *lb_rif = mlxsw_sp_rif_ipip_lb_rif(rif);
|
|
|
|
u32 ul_tb_id = mlxsw_sp_ipip_dev_ul_tb_id(rif->dev);
|
|
|
|
struct mlxsw_sp *mlxsw_sp = rif->mlxsw_sp;
|
|
|
|
struct mlxsw_sp_rif *ul_rif;
|
|
|
|
int err;
|
|
|
|
|
|
|
|
ul_rif = mlxsw_sp_ul_rif_get(mlxsw_sp, ul_tb_id, NULL);
|
|
|
|
if (IS_ERR(ul_rif))
|
|
|
|
return PTR_ERR(ul_rif);
|
|
|
|
|
|
|
|
err = mlxsw_sp_rif_ipip_lb_op(lb_rif, 0, ul_rif->rif_index, true);
|
|
|
|
if (err)
|
|
|
|
goto err_loopback_op;
|
|
|
|
|
|
|
|
lb_rif->ul_vr_id = 0;
|
|
|
|
lb_rif->ul_rif_id = ul_rif->rif_index;
|
|
|
|
|
2019-01-20 14:50:40 +08:00
|
|
|
return 0;
|
2019-01-20 14:50:51 +08:00
|
|
|
|
|
|
|
err_loopback_op:
|
|
|
|
mlxsw_sp_ul_rif_put(ul_rif);
|
|
|
|
return err;
|
2019-01-20 14:50:40 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
static void mlxsw_sp2_rif_ipip_lb_deconfigure(struct mlxsw_sp_rif *rif)
|
|
|
|
{
|
2019-01-20 14:50:51 +08:00
|
|
|
struct mlxsw_sp_rif_ipip_lb *lb_rif = mlxsw_sp_rif_ipip_lb_rif(rif);
|
|
|
|
struct mlxsw_sp *mlxsw_sp = rif->mlxsw_sp;
|
|
|
|
struct mlxsw_sp_rif *ul_rif;
|
|
|
|
|
|
|
|
ul_rif = mlxsw_sp_rif_by_index(mlxsw_sp, lb_rif->ul_rif_id);
|
|
|
|
mlxsw_sp_rif_ipip_lb_op(lb_rif, 0, lb_rif->ul_rif_id, false);
|
|
|
|
mlxsw_sp_ul_rif_put(ul_rif);
|
2019-01-20 14:50:40 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
static const struct mlxsw_sp_rif_ops mlxsw_sp2_rif_ipip_lb_ops = {
|
|
|
|
.type = MLXSW_SP_RIF_TYPE_IPIP_LB,
|
|
|
|
.rif_size = sizeof(struct mlxsw_sp_rif_ipip_lb),
|
|
|
|
.setup = mlxsw_sp_rif_ipip_lb_setup,
|
|
|
|
.configure = mlxsw_sp2_rif_ipip_lb_configure,
|
|
|
|
.deconfigure = mlxsw_sp2_rif_ipip_lb_deconfigure,
|
|
|
|
};
|
|
|
|
|
|
|
|
const struct mlxsw_sp_rif_ops *mlxsw_sp2_rif_ops_arr[] = {
|
|
|
|
[MLXSW_SP_RIF_TYPE_SUBPORT] = &mlxsw_sp_rif_subport_ops,
|
|
|
|
[MLXSW_SP_RIF_TYPE_VLAN] = &mlxsw_sp_rif_vlan_emu_ops,
|
|
|
|
[MLXSW_SP_RIF_TYPE_FID] = &mlxsw_sp_rif_fid_ops,
|
|
|
|
[MLXSW_SP_RIF_TYPE_IPIP_LB] = &mlxsw_sp2_rif_ipip_lb_ops,
|
2017-05-26 14:37:40 +08:00
|
|
|
};
|
|
|
|
|
2017-05-17 01:38:29 +08:00
|
|
|
static int mlxsw_sp_rifs_init(struct mlxsw_sp *mlxsw_sp)
|
|
|
|
{
|
|
|
|
u64 max_rifs = MLXSW_CORE_RES_GET(mlxsw_sp->core, MAX_RIFS);
|
|
|
|
|
|
|
|
mlxsw_sp->router->rifs = kcalloc(max_rifs,
|
|
|
|
sizeof(struct mlxsw_sp_rif *),
|
|
|
|
GFP_KERNEL);
|
|
|
|
if (!mlxsw_sp->router->rifs)
|
|
|
|
return -ENOMEM;
|
2017-05-26 14:37:40 +08:00
|
|
|
|
2017-05-17 01:38:29 +08:00
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
|
|
|
static void mlxsw_sp_rifs_fini(struct mlxsw_sp *mlxsw_sp)
|
|
|
|
{
|
|
|
|
int i;
|
|
|
|
|
|
|
|
for (i = 0; i < MLXSW_CORE_RES_GET(mlxsw_sp->core, MAX_RIFS); i++)
|
|
|
|
WARN_ON_ONCE(mlxsw_sp->router->rifs[i]);
|
|
|
|
|
|
|
|
kfree(mlxsw_sp->router->rifs);
|
|
|
|
}
|
|
|
|
|
2017-10-20 15:16:16 +08:00
|
|
|
static int
|
|
|
|
mlxsw_sp_ipip_config_tigcr(struct mlxsw_sp *mlxsw_sp)
|
|
|
|
{
|
|
|
|
char tigcr_pl[MLXSW_REG_TIGCR_LEN];
|
|
|
|
|
|
|
|
mlxsw_reg_tigcr_pack(tigcr_pl, true, 0);
|
|
|
|
return mlxsw_reg_write(mlxsw_sp->core, MLXSW_REG(tigcr), tigcr_pl);
|
|
|
|
}
|
|
|
|
|
2017-09-03 05:49:17 +08:00
|
|
|
static int mlxsw_sp_ipips_init(struct mlxsw_sp *mlxsw_sp)
|
|
|
|
{
|
2020-01-19 21:00:52 +08:00
|
|
|
int err;
|
|
|
|
|
2017-09-03 05:49:17 +08:00
|
|
|
mlxsw_sp->router->ipip_ops_arr = mlxsw_sp_ipip_ops_arr;
|
2017-09-03 05:49:23 +08:00
|
|
|
INIT_LIST_HEAD(&mlxsw_sp->router->ipip_list);
|
2020-01-19 21:00:52 +08:00
|
|
|
|
|
|
|
err = mlxsw_sp_ipip_ecn_encap_init(mlxsw_sp);
|
|
|
|
if (err)
|
|
|
|
return err;
|
|
|
|
err = mlxsw_sp_ipip_ecn_decap_init(mlxsw_sp);
|
|
|
|
if (err)
|
|
|
|
return err;
|
|
|
|
|
2017-10-20 15:16:16 +08:00
|
|
|
return mlxsw_sp_ipip_config_tigcr(mlxsw_sp);
|
2017-09-03 05:49:17 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
static void mlxsw_sp_ipips_fini(struct mlxsw_sp *mlxsw_sp)
|
|
|
|
{
|
2017-09-03 05:49:23 +08:00
|
|
|
WARN_ON(!list_empty(&mlxsw_sp->router->ipip_list));
|
2017-09-03 05:49:17 +08:00
|
|
|
}
|
|
|
|
|
2016-12-03 23:45:07 +08:00
|
|
|
static void mlxsw_sp_router_fib_dump_flush(struct notifier_block *nb)
|
|
|
|
{
|
2017-05-17 01:38:28 +08:00
|
|
|
struct mlxsw_sp_router *router;
|
2016-12-03 23:45:07 +08:00
|
|
|
|
|
|
|
/* Flush pending FIB notifications and then flush the device's
|
|
|
|
* table before requesting another dump. The FIB notification
|
|
|
|
* block is unregistered, so no need to take RTNL.
|
|
|
|
*/
|
|
|
|
mlxsw_core_flush_owq();
|
2017-05-17 01:38:28 +08:00
|
|
|
router = container_of(nb, struct mlxsw_sp_router, fib_nb);
|
|
|
|
mlxsw_sp_router_fib_flush(router->mlxsw_sp);
|
2016-12-03 23:45:07 +08:00
|
|
|
}
|
|
|
|
|
2017-11-03 00:14:09 +08:00
|
|
|
#ifdef CONFIG_IP_ROUTE_MULTIPATH
|
|
|
|
static void mlxsw_sp_mp_hash_header_set(char *recr2_pl, int header)
|
|
|
|
{
|
|
|
|
mlxsw_reg_recr2_outer_header_enables_set(recr2_pl, header, true);
|
|
|
|
}
|
|
|
|
|
|
|
|
static void mlxsw_sp_mp_hash_field_set(char *recr2_pl, int field)
|
|
|
|
{
|
|
|
|
mlxsw_reg_recr2_outer_header_fields_enable_set(recr2_pl, field, true);
|
|
|
|
}
|
|
|
|
|
2019-10-03 17:49:32 +08:00
|
|
|
static void mlxsw_sp_mp4_hash_init(struct mlxsw_sp *mlxsw_sp, char *recr2_pl)
|
2017-11-03 00:14:09 +08:00
|
|
|
{
|
2019-10-03 17:49:32 +08:00
|
|
|
struct net *net = mlxsw_sp_net(mlxsw_sp);
|
|
|
|
bool only_l3 = !net->ipv4.sysctl_fib_multipath_hash_policy;
|
2017-11-03 00:14:09 +08:00
|
|
|
|
|
|
|
mlxsw_sp_mp_hash_header_set(recr2_pl,
|
|
|
|
MLXSW_REG_RECR2_IPV4_EN_NOT_TCP_NOT_UDP);
|
|
|
|
mlxsw_sp_mp_hash_header_set(recr2_pl, MLXSW_REG_RECR2_IPV4_EN_TCP_UDP);
|
|
|
|
mlxsw_reg_recr2_ipv4_sip_enable(recr2_pl);
|
|
|
|
mlxsw_reg_recr2_ipv4_dip_enable(recr2_pl);
|
|
|
|
if (only_l3)
|
|
|
|
return;
|
|
|
|
mlxsw_sp_mp_hash_header_set(recr2_pl, MLXSW_REG_RECR2_TCP_UDP_EN_IPV4);
|
|
|
|
mlxsw_sp_mp_hash_field_set(recr2_pl, MLXSW_REG_RECR2_IPV4_PROTOCOL);
|
|
|
|
mlxsw_sp_mp_hash_field_set(recr2_pl, MLXSW_REG_RECR2_TCP_UDP_SPORT);
|
|
|
|
mlxsw_sp_mp_hash_field_set(recr2_pl, MLXSW_REG_RECR2_TCP_UDP_DPORT);
|
|
|
|
}
|
|
|
|
|
2019-10-03 17:49:32 +08:00
|
|
|
static void mlxsw_sp_mp6_hash_init(struct mlxsw_sp *mlxsw_sp, char *recr2_pl)
|
2017-11-03 00:14:09 +08:00
|
|
|
{
|
2019-10-03 17:49:32 +08:00
|
|
|
bool only_l3 = !ip6_multipath_hash_policy(mlxsw_sp_net(mlxsw_sp));
|
2018-03-03 00:32:19 +08:00
|
|
|
|
2017-11-03 00:14:09 +08:00
|
|
|
mlxsw_sp_mp_hash_header_set(recr2_pl,
|
|
|
|
MLXSW_REG_RECR2_IPV6_EN_NOT_TCP_NOT_UDP);
|
|
|
|
mlxsw_sp_mp_hash_header_set(recr2_pl, MLXSW_REG_RECR2_IPV6_EN_TCP_UDP);
|
|
|
|
mlxsw_reg_recr2_ipv6_sip_enable(recr2_pl);
|
|
|
|
mlxsw_reg_recr2_ipv6_dip_enable(recr2_pl);
|
|
|
|
mlxsw_sp_mp_hash_field_set(recr2_pl, MLXSW_REG_RECR2_IPV6_NEXT_HEADER);
|
2018-03-03 00:32:19 +08:00
|
|
|
if (only_l3) {
|
|
|
|
mlxsw_sp_mp_hash_field_set(recr2_pl,
|
|
|
|
MLXSW_REG_RECR2_IPV6_FLOW_LABEL);
|
|
|
|
} else {
|
|
|
|
mlxsw_sp_mp_hash_header_set(recr2_pl,
|
|
|
|
MLXSW_REG_RECR2_TCP_UDP_EN_IPV6);
|
|
|
|
mlxsw_sp_mp_hash_field_set(recr2_pl,
|
|
|
|
MLXSW_REG_RECR2_TCP_UDP_SPORT);
|
|
|
|
mlxsw_sp_mp_hash_field_set(recr2_pl,
|
|
|
|
MLXSW_REG_RECR2_TCP_UDP_DPORT);
|
|
|
|
}
|
2017-11-03 00:14:09 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
static int mlxsw_sp_mp_hash_init(struct mlxsw_sp *mlxsw_sp)
|
|
|
|
{
|
|
|
|
char recr2_pl[MLXSW_REG_RECR2_LEN];
|
|
|
|
u32 seed;
|
|
|
|
|
2019-04-21 15:18:34 +08:00
|
|
|
seed = jhash(mlxsw_sp->base_mac, sizeof(mlxsw_sp->base_mac), 0);
|
2017-11-03 00:14:09 +08:00
|
|
|
mlxsw_reg_recr2_pack(recr2_pl, seed);
|
2019-10-03 17:49:32 +08:00
|
|
|
mlxsw_sp_mp4_hash_init(mlxsw_sp, recr2_pl);
|
|
|
|
mlxsw_sp_mp6_hash_init(mlxsw_sp, recr2_pl);
|
2017-11-03 00:14:09 +08:00
|
|
|
|
|
|
|
return mlxsw_reg_write(mlxsw_sp->core, MLXSW_REG(recr2), recr2_pl);
|
|
|
|
}
|
|
|
|
#else
|
|
|
|
/* Stub used when CONFIG_IP_ROUTE_MULTIPATH is not set: nothing to program,
 * always succeeds.
 */
static int mlxsw_sp_mp_hash_init(struct mlxsw_sp *mlxsw_sp)
{
	return 0;
}
|
|
|
|
#endif
|
|
|
|
|
2018-01-14 19:33:14 +08:00
|
|
|
static int mlxsw_sp_dscp_init(struct mlxsw_sp *mlxsw_sp)
|
|
|
|
{
|
|
|
|
char rdpm_pl[MLXSW_REG_RDPM_LEN];
|
|
|
|
unsigned int i;
|
|
|
|
|
|
|
|
MLXSW_REG_ZERO(rdpm, rdpm_pl);
|
|
|
|
|
|
|
|
/* HW is determining switch priority based on DSCP-bits, but the
|
|
|
|
* kernel is still doing that based on the ToS. Since there's a
|
|
|
|
* mismatch in bits we need to make sure to translate the right
|
|
|
|
* value ToS would observe, skipping the 2 least-significant ECN bits.
|
|
|
|
*/
|
|
|
|
for (i = 0; i < MLXSW_REG_RDPM_DSCP_ENTRY_REC_MAX_COUNT; i++)
|
|
|
|
mlxsw_reg_rdpm_pack(rdpm_pl, i, rt_tos2priority(i << 2));
|
|
|
|
|
|
|
|
return mlxsw_reg_write(mlxsw_sp->core, MLXSW_REG(rdpm), rdpm_pl);
|
|
|
|
}
|
|
|
|
|
2017-03-10 15:53:39 +08:00
|
|
|
static int __mlxsw_sp_router_init(struct mlxsw_sp *mlxsw_sp)
|
|
|
|
{
|
2019-10-03 17:49:32 +08:00
|
|
|
struct net *net = mlxsw_sp_net(mlxsw_sp);
|
|
|
|
bool usp = net->ipv4.sysctl_ip_fwd_update_priority;
|
2017-03-10 15:53:39 +08:00
|
|
|
char rgcr_pl[MLXSW_REG_RGCR_LEN];
|
|
|
|
u64 max_rifs;
|
|
|
|
int err;
|
|
|
|
|
|
|
|
if (!MLXSW_CORE_RES_VALID(mlxsw_sp->core, MAX_RIFS))
|
|
|
|
return -EIO;
|
|
|
|
max_rifs = MLXSW_CORE_RES_GET(mlxsw_sp->core, MAX_RIFS);
|
|
|
|
|
2017-07-18 16:10:09 +08:00
|
|
|
mlxsw_reg_rgcr_pack(rgcr_pl, true, true);
|
2017-03-10 15:53:39 +08:00
|
|
|
mlxsw_reg_rgcr_max_router_interfaces_set(rgcr_pl, max_rifs);
|
2018-08-01 06:38:03 +08:00
|
|
|
mlxsw_reg_rgcr_usp_set(rgcr_pl, usp);
|
2017-03-10 15:53:39 +08:00
|
|
|
err = mlxsw_reg_write(mlxsw_sp->core, MLXSW_REG(rgcr), rgcr_pl);
|
|
|
|
if (err)
|
2017-05-17 01:38:29 +08:00
|
|
|
return err;
|
2017-03-10 15:53:39 +08:00
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
|
|
|
static void __mlxsw_sp_router_fini(struct mlxsw_sp *mlxsw_sp)
|
|
|
|
{
|
|
|
|
char rgcr_pl[MLXSW_REG_RGCR_LEN];
|
|
|
|
|
2017-07-18 16:10:09 +08:00
|
|
|
mlxsw_reg_rgcr_pack(rgcr_pl, false, false);
|
2017-03-10 15:53:39 +08:00
|
|
|
mlxsw_reg_write(mlxsw_sp->core, MLXSW_REG(rgcr), rgcr_pl);
|
|
|
|
}
|
|
|
|
|
2019-10-03 17:49:34 +08:00
|
|
|
int mlxsw_sp_router_init(struct mlxsw_sp *mlxsw_sp,
|
|
|
|
struct netlink_ext_ack *extack)
|
2016-09-26 18:52:31 +08:00
|
|
|
{
|
2017-05-17 01:38:25 +08:00
|
|
|
struct mlxsw_sp_router *router;
|
2016-09-26 18:52:31 +08:00
|
|
|
int err;
|
|
|
|
|
2017-05-17 01:38:25 +08:00
|
|
|
router = kzalloc(sizeof(*mlxsw_sp->router), GFP_KERNEL);
|
|
|
|
if (!router)
|
|
|
|
return -ENOMEM;
|
2020-02-22 01:54:09 +08:00
|
|
|
mutex_init(&router->lock);
|
2017-05-17 01:38:25 +08:00
|
|
|
mlxsw_sp->router = router;
|
|
|
|
router->mlxsw_sp = mlxsw_sp;
|
|
|
|
|
2018-12-19 14:08:48 +08:00
|
|
|
router->inetaddr_nb.notifier_call = mlxsw_sp_inetaddr_event;
|
|
|
|
err = register_inetaddr_notifier(&router->inetaddr_nb);
|
|
|
|
if (err)
|
|
|
|
goto err_register_inetaddr_notifier;
|
|
|
|
|
|
|
|
router->inet6addr_nb.notifier_call = mlxsw_sp_inet6addr_event;
|
|
|
|
err = register_inet6addr_notifier(&router->inet6addr_nb);
|
|
|
|
if (err)
|
|
|
|
goto err_register_inet6addr_notifier;
|
|
|
|
|
2017-05-17 01:38:25 +08:00
|
|
|
INIT_LIST_HEAD(&mlxsw_sp->router->nexthop_neighs_list);
|
2016-09-26 18:52:31 +08:00
|
|
|
err = __mlxsw_sp_router_init(mlxsw_sp);
|
|
|
|
if (err)
|
2017-05-17 01:38:25 +08:00
|
|
|
goto err_router_init;
|
2016-09-26 18:52:31 +08:00
|
|
|
|
2017-05-17 01:38:29 +08:00
|
|
|
err = mlxsw_sp_rifs_init(mlxsw_sp);
|
|
|
|
if (err)
|
|
|
|
goto err_rifs_init;
|
|
|
|
|
2017-09-03 05:49:17 +08:00
|
|
|
err = mlxsw_sp_ipips_init(mlxsw_sp);
|
|
|
|
if (err)
|
|
|
|
goto err_ipips_init;
|
|
|
|
|
2017-05-17 01:38:25 +08:00
|
|
|
err = rhashtable_init(&mlxsw_sp->router->nexthop_ht,
|
2017-02-08 18:16:30 +08:00
|
|
|
&mlxsw_sp_nexthop_ht_params);
|
|
|
|
if (err)
|
|
|
|
goto err_nexthop_ht_init;
|
|
|
|
|
2017-05-17 01:38:25 +08:00
|
|
|
err = rhashtable_init(&mlxsw_sp->router->nexthop_group_ht,
|
2017-02-08 18:16:29 +08:00
|
|
|
&mlxsw_sp_nexthop_group_ht_params);
|
|
|
|
if (err)
|
|
|
|
goto err_nexthop_group_ht_init;
|
|
|
|
|
2017-09-25 16:32:23 +08:00
|
|
|
INIT_LIST_HEAD(&mlxsw_sp->router->nexthop_list);
|
2017-03-24 15:02:47 +08:00
|
|
|
err = mlxsw_sp_lpm_init(mlxsw_sp);
|
|
|
|
if (err)
|
|
|
|
goto err_lpm_init;
|
|
|
|
|
2017-09-27 14:23:20 +08:00
|
|
|
err = mlxsw_sp_mr_init(mlxsw_sp, &mlxsw_sp_mr_tcam_ops);
|
|
|
|
if (err)
|
|
|
|
goto err_mr_init;
|
|
|
|
|
2016-09-26 18:52:31 +08:00
|
|
|
err = mlxsw_sp_vrs_init(mlxsw_sp);
|
|
|
|
if (err)
|
|
|
|
goto err_vrs_init;
|
|
|
|
|
2016-10-27 21:12:57 +08:00
|
|
|
err = mlxsw_sp_neigh_init(mlxsw_sp);
|
2016-09-26 18:52:31 +08:00
|
|
|
if (err)
|
|
|
|
goto err_neigh_init;
|
|
|
|
|
2017-11-03 00:14:06 +08:00
|
|
|
mlxsw_sp->router->netevent_nb.notifier_call =
|
|
|
|
mlxsw_sp_router_netevent_event;
|
|
|
|
err = register_netevent_notifier(&mlxsw_sp->router->netevent_nb);
|
|
|
|
if (err)
|
|
|
|
goto err_register_netevent_notifier;
|
|
|
|
|
2017-11-03 00:14:09 +08:00
|
|
|
err = mlxsw_sp_mp_hash_init(mlxsw_sp);
|
|
|
|
if (err)
|
|
|
|
goto err_mp_hash_init;
|
|
|
|
|
2018-01-14 19:33:14 +08:00
|
|
|
err = mlxsw_sp_dscp_init(mlxsw_sp);
|
|
|
|
if (err)
|
|
|
|
goto err_dscp_init;
|
|
|
|
|
2017-05-17 01:38:28 +08:00
|
|
|
mlxsw_sp->router->fib_nb.notifier_call = mlxsw_sp_router_fib_event;
|
2019-10-03 17:49:32 +08:00
|
|
|
err = register_fib_notifier(mlxsw_sp_net(mlxsw_sp),
|
|
|
|
&mlxsw_sp->router->fib_nb,
|
2019-10-03 17:49:34 +08:00
|
|
|
mlxsw_sp_router_fib_dump_flush, extack);
|
2016-12-03 23:45:07 +08:00
|
|
|
if (err)
|
|
|
|
goto err_register_fib_notifier;
|
|
|
|
|
2016-09-26 18:52:31 +08:00
|
|
|
return 0;
|
|
|
|
|
2016-12-03 23:45:07 +08:00
|
|
|
err_register_fib_notifier:
|
2018-01-14 19:33:14 +08:00
|
|
|
err_dscp_init:
|
2017-11-03 00:14:09 +08:00
|
|
|
err_mp_hash_init:
|
2017-11-03 00:14:06 +08:00
|
|
|
unregister_netevent_notifier(&mlxsw_sp->router->netevent_nb);
|
|
|
|
err_register_netevent_notifier:
|
2016-12-03 23:45:07 +08:00
|
|
|
mlxsw_sp_neigh_fini(mlxsw_sp);
|
2016-09-26 18:52:31 +08:00
|
|
|
err_neigh_init:
|
|
|
|
mlxsw_sp_vrs_fini(mlxsw_sp);
|
|
|
|
err_vrs_init:
|
2017-09-27 14:23:20 +08:00
|
|
|
mlxsw_sp_mr_fini(mlxsw_sp);
|
|
|
|
err_mr_init:
|
2017-03-24 15:02:47 +08:00
|
|
|
mlxsw_sp_lpm_fini(mlxsw_sp);
|
|
|
|
err_lpm_init:
|
2017-05-17 01:38:25 +08:00
|
|
|
rhashtable_destroy(&mlxsw_sp->router->nexthop_group_ht);
|
2017-02-08 18:16:29 +08:00
|
|
|
err_nexthop_group_ht_init:
|
2017-05-17 01:38:25 +08:00
|
|
|
rhashtable_destroy(&mlxsw_sp->router->nexthop_ht);
|
2017-02-08 18:16:30 +08:00
|
|
|
err_nexthop_ht_init:
|
2017-09-03 05:49:17 +08:00
|
|
|
mlxsw_sp_ipips_fini(mlxsw_sp);
|
|
|
|
err_ipips_init:
|
2017-05-17 01:38:29 +08:00
|
|
|
mlxsw_sp_rifs_fini(mlxsw_sp);
|
|
|
|
err_rifs_init:
|
2016-09-26 18:52:31 +08:00
|
|
|
__mlxsw_sp_router_fini(mlxsw_sp);
|
2017-05-17 01:38:25 +08:00
|
|
|
err_router_init:
|
2018-12-19 14:08:48 +08:00
|
|
|
unregister_inet6addr_notifier(&router->inet6addr_nb);
|
|
|
|
err_register_inet6addr_notifier:
|
|
|
|
unregister_inetaddr_notifier(&router->inetaddr_nb);
|
|
|
|
err_register_inetaddr_notifier:
|
2020-02-22 01:54:09 +08:00
|
|
|
mutex_destroy(&mlxsw_sp->router->lock);
|
2017-05-17 01:38:25 +08:00
|
|
|
kfree(mlxsw_sp->router);
|
2016-09-26 18:52:31 +08:00
|
|
|
return err;
|
|
|
|
}
|
|
|
|
|
|
|
|
void mlxsw_sp_router_fini(struct mlxsw_sp *mlxsw_sp)
|
|
|
|
{
|
2019-10-03 17:49:32 +08:00
|
|
|
unregister_fib_notifier(mlxsw_sp_net(mlxsw_sp),
|
|
|
|
&mlxsw_sp->router->fib_nb);
|
2017-11-03 00:14:06 +08:00
|
|
|
unregister_netevent_notifier(&mlxsw_sp->router->netevent_nb);
|
2016-09-26 18:52:31 +08:00
|
|
|
mlxsw_sp_neigh_fini(mlxsw_sp);
|
|
|
|
mlxsw_sp_vrs_fini(mlxsw_sp);
|
2017-09-27 14:23:20 +08:00
|
|
|
mlxsw_sp_mr_fini(mlxsw_sp);
|
2017-03-24 15:02:47 +08:00
|
|
|
mlxsw_sp_lpm_fini(mlxsw_sp);
|
2017-05-17 01:38:25 +08:00
|
|
|
rhashtable_destroy(&mlxsw_sp->router->nexthop_group_ht);
|
|
|
|
rhashtable_destroy(&mlxsw_sp->router->nexthop_ht);
|
2017-09-03 05:49:17 +08:00
|
|
|
mlxsw_sp_ipips_fini(mlxsw_sp);
|
2017-05-17 01:38:29 +08:00
|
|
|
mlxsw_sp_rifs_fini(mlxsw_sp);
|
2016-09-26 18:52:31 +08:00
|
|
|
__mlxsw_sp_router_fini(mlxsw_sp);
|
2018-12-19 14:08:48 +08:00
|
|
|
unregister_inet6addr_notifier(&mlxsw_sp->router->inet6addr_nb);
|
|
|
|
unregister_inetaddr_notifier(&mlxsw_sp->router->inetaddr_nb);
|
2020-02-22 01:54:09 +08:00
|
|
|
mutex_destroy(&mlxsw_sp->router->lock);
|
2017-05-17 01:38:25 +08:00
|
|
|
kfree(mlxsw_sp->router);
|
2016-09-26 18:52:31 +08:00
|
|
|
}
|