c6385c0b67
A key component of the resilient hashing algorithm is the hash buckets' activity. If a bucket is active, it will not be populated with a new nexthop in order not to break existing flows. Therefore, in order to easily and thoroughly test the algorithm, we need to be in full control over the reported activity. Add a debugfs interface that allows user space to have netdevsim report a nexthop bucket within a resilient nexthop group as active. For example: # echo 10 23 > /sys/kernel/debug/netdevsim/netdevsim10/fib/nexthop_bucket_activity Will mark bucket 23 in nexthop group 10 as active. Signed-off-by: Ido Schimmel <idosch@nvidia.com> Reviewed-by: Petr Machata <petrm@nvidia.com> Signed-off-by: Petr Machata <petrm@nvidia.com> Signed-off-by: David S. Miller <davem@davemloft.net>
1630 lines
39 KiB
C
1630 lines
39 KiB
C
/*
|
|
* Copyright (c) 2018 Cumulus Networks. All rights reserved.
|
|
* Copyright (c) 2018 David Ahern <dsa@cumulusnetworks.com>
|
|
*
|
|
* This software is licensed under the GNU General License Version 2,
|
|
* June 1991 as shown in the file COPYING in the top-level directory of this
|
|
* source tree.
|
|
*
|
|
* THE COPYRIGHT HOLDERS AND/OR OTHER PARTIES PROVIDE THE PROGRAM "AS IS"
|
|
* WITHOUT WARRANTY OF ANY KIND, EITHER EXPRESSED OR IMPLIED, INCLUDING,
|
|
* BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS
|
|
* FOR A PARTICULAR PURPOSE. THE ENTIRE RISK AS TO THE QUALITY AND PERFORMANCE
|
|
* OF THE PROGRAM IS WITH YOU. SHOULD THE PROGRAM PROVE DEFECTIVE, YOU ASSUME
|
|
* THE COST OF ALL NECESSARY SERVICING, REPAIR OR CORRECTION.
|
|
*/
|
|
|
|
#include <linux/bitmap.h>
|
|
#include <linux/in6.h>
|
|
#include <linux/kernel.h>
|
|
#include <linux/list.h>
|
|
#include <linux/rhashtable.h>
|
|
#include <linux/spinlock_types.h>
|
|
#include <linux/types.h>
|
|
#include <net/fib_notifier.h>
|
|
#include <net/ip_fib.h>
|
|
#include <net/ip6_fib.h>
|
|
#include <net/fib_rules.h>
|
|
#include <net/net_namespace.h>
|
|
#include <net/nexthop.h>
|
|
#include <linux/debugfs.h>
|
|
|
|
#include "netdevsim.h"
|
|
|
|
struct nsim_fib_entry {
|
|
u64 max;
|
|
atomic64_t num;
|
|
};
|
|
|
|
struct nsim_per_fib_data {
|
|
struct nsim_fib_entry fib;
|
|
struct nsim_fib_entry rules;
|
|
};
|
|
|
|
struct nsim_fib_data {
|
|
struct notifier_block fib_nb;
|
|
struct nsim_per_fib_data ipv4;
|
|
struct nsim_per_fib_data ipv6;
|
|
struct nsim_fib_entry nexthops;
|
|
struct rhashtable fib_rt_ht;
|
|
struct list_head fib_rt_list;
|
|
struct mutex fib_lock; /* Protects FIB HT and list */
|
|
struct notifier_block nexthop_nb;
|
|
struct rhashtable nexthop_ht;
|
|
struct devlink *devlink;
|
|
struct work_struct fib_event_work;
|
|
struct list_head fib_event_queue;
|
|
spinlock_t fib_event_queue_lock; /* Protects fib event queue list */
|
|
struct mutex nh_lock; /* Protects NH HT */
|
|
struct dentry *ddir;
|
|
bool fail_route_offload;
|
|
bool fail_res_nexthop_group_replace;
|
|
bool fail_nexthop_bucket_replace;
|
|
};
|
|
|
|
struct nsim_fib_rt_key {
|
|
unsigned char addr[sizeof(struct in6_addr)];
|
|
unsigned char prefix_len;
|
|
int family;
|
|
u32 tb_id;
|
|
};
|
|
|
|
struct nsim_fib_rt {
|
|
struct nsim_fib_rt_key key;
|
|
struct rhash_head ht_node;
|
|
struct list_head list; /* Member of fib_rt_list */
|
|
};
|
|
|
|
struct nsim_fib4_rt {
|
|
struct nsim_fib_rt common;
|
|
struct fib_info *fi;
|
|
u8 tos;
|
|
u8 type;
|
|
};
|
|
|
|
struct nsim_fib6_rt {
|
|
struct nsim_fib_rt common;
|
|
struct list_head nh_list;
|
|
unsigned int nhs;
|
|
};
|
|
|
|
struct nsim_fib6_rt_nh {
|
|
struct list_head list; /* Member of nh_list */
|
|
struct fib6_info *rt;
|
|
};
|
|
|
|
struct nsim_fib6_event {
|
|
struct fib6_info **rt_arr;
|
|
unsigned int nrt6;
|
|
};
|
|
|
|
struct nsim_fib_event {
|
|
struct list_head list; /* node in fib queue */
|
|
union {
|
|
struct fib_entry_notifier_info fen_info;
|
|
struct nsim_fib6_event fib6_event;
|
|
};
|
|
struct nsim_fib_data *data;
|
|
unsigned long event;
|
|
int family;
|
|
};
|
|
|
|
static const struct rhashtable_params nsim_fib_rt_ht_params = {
|
|
.key_offset = offsetof(struct nsim_fib_rt, key),
|
|
.head_offset = offsetof(struct nsim_fib_rt, ht_node),
|
|
.key_len = sizeof(struct nsim_fib_rt_key),
|
|
.automatic_shrinking = true,
|
|
};
|
|
|
|
struct nsim_nexthop {
|
|
struct rhash_head ht_node;
|
|
u64 occ;
|
|
u32 id;
|
|
bool is_resilient;
|
|
};
|
|
|
|
static const struct rhashtable_params nsim_nexthop_ht_params = {
|
|
.key_offset = offsetof(struct nsim_nexthop, id),
|
|
.head_offset = offsetof(struct nsim_nexthop, ht_node),
|
|
.key_len = sizeof(u32),
|
|
.automatic_shrinking = true,
|
|
};
|
|
|
|
u64 nsim_fib_get_val(struct nsim_fib_data *fib_data,
|
|
enum nsim_resource_id res_id, bool max)
|
|
{
|
|
struct nsim_fib_entry *entry;
|
|
|
|
switch (res_id) {
|
|
case NSIM_RESOURCE_IPV4_FIB:
|
|
entry = &fib_data->ipv4.fib;
|
|
break;
|
|
case NSIM_RESOURCE_IPV4_FIB_RULES:
|
|
entry = &fib_data->ipv4.rules;
|
|
break;
|
|
case NSIM_RESOURCE_IPV6_FIB:
|
|
entry = &fib_data->ipv6.fib;
|
|
break;
|
|
case NSIM_RESOURCE_IPV6_FIB_RULES:
|
|
entry = &fib_data->ipv6.rules;
|
|
break;
|
|
case NSIM_RESOURCE_NEXTHOPS:
|
|
entry = &fib_data->nexthops;
|
|
break;
|
|
default:
|
|
return 0;
|
|
}
|
|
|
|
return max ? entry->max : atomic64_read(&entry->num);
|
|
}
|
|
|
|
static void nsim_fib_set_max(struct nsim_fib_data *fib_data,
|
|
enum nsim_resource_id res_id, u64 val)
|
|
{
|
|
struct nsim_fib_entry *entry;
|
|
|
|
switch (res_id) {
|
|
case NSIM_RESOURCE_IPV4_FIB:
|
|
entry = &fib_data->ipv4.fib;
|
|
break;
|
|
case NSIM_RESOURCE_IPV4_FIB_RULES:
|
|
entry = &fib_data->ipv4.rules;
|
|
break;
|
|
case NSIM_RESOURCE_IPV6_FIB:
|
|
entry = &fib_data->ipv6.fib;
|
|
break;
|
|
case NSIM_RESOURCE_IPV6_FIB_RULES:
|
|
entry = &fib_data->ipv6.rules;
|
|
break;
|
|
case NSIM_RESOURCE_NEXTHOPS:
|
|
entry = &fib_data->nexthops;
|
|
break;
|
|
default:
|
|
WARN_ON(1);
|
|
return;
|
|
}
|
|
entry->max = val;
|
|
}
|
|
|
|
static int nsim_fib_rule_account(struct nsim_fib_entry *entry, bool add,
|
|
struct netlink_ext_ack *extack)
|
|
{
|
|
int err = 0;
|
|
|
|
if (add) {
|
|
if (!atomic64_add_unless(&entry->num, 1, entry->max)) {
|
|
err = -ENOSPC;
|
|
NL_SET_ERR_MSG_MOD(extack, "Exceeded number of supported fib rule entries");
|
|
}
|
|
} else {
|
|
atomic64_dec_if_positive(&entry->num);
|
|
}
|
|
|
|
return err;
|
|
}
|
|
|
|
static int nsim_fib_rule_event(struct nsim_fib_data *data,
|
|
struct fib_notifier_info *info, bool add)
|
|
{
|
|
struct netlink_ext_ack *extack = info->extack;
|
|
int err = 0;
|
|
|
|
switch (info->family) {
|
|
case AF_INET:
|
|
err = nsim_fib_rule_account(&data->ipv4.rules, add, extack);
|
|
break;
|
|
case AF_INET6:
|
|
err = nsim_fib_rule_account(&data->ipv6.rules, add, extack);
|
|
break;
|
|
}
|
|
|
|
return err;
|
|
}
|
|
|
|
static int nsim_fib_account(struct nsim_fib_entry *entry, bool add)
|
|
{
|
|
int err = 0;
|
|
|
|
if (add) {
|
|
if (!atomic64_add_unless(&entry->num, 1, entry->max))
|
|
err = -ENOSPC;
|
|
} else {
|
|
atomic64_dec_if_positive(&entry->num);
|
|
}
|
|
|
|
return err;
|
|
}
|
|
|
|
static void nsim_fib_rt_init(struct nsim_fib_data *data,
|
|
struct nsim_fib_rt *fib_rt, const void *addr,
|
|
size_t addr_len, unsigned int prefix_len,
|
|
int family, u32 tb_id)
|
|
{
|
|
memcpy(fib_rt->key.addr, addr, addr_len);
|
|
fib_rt->key.prefix_len = prefix_len;
|
|
fib_rt->key.family = family;
|
|
fib_rt->key.tb_id = tb_id;
|
|
list_add(&fib_rt->list, &data->fib_rt_list);
|
|
}
|
|
|
|
static void nsim_fib_rt_fini(struct nsim_fib_rt *fib_rt)
|
|
{
|
|
list_del(&fib_rt->list);
|
|
}
|
|
|
|
static struct nsim_fib_rt *nsim_fib_rt_lookup(struct rhashtable *fib_rt_ht,
|
|
const void *addr, size_t addr_len,
|
|
unsigned int prefix_len,
|
|
int family, u32 tb_id)
|
|
{
|
|
struct nsim_fib_rt_key key;
|
|
|
|
memset(&key, 0, sizeof(key));
|
|
memcpy(key.addr, addr, addr_len);
|
|
key.prefix_len = prefix_len;
|
|
key.family = family;
|
|
key.tb_id = tb_id;
|
|
|
|
return rhashtable_lookup_fast(fib_rt_ht, &key, nsim_fib_rt_ht_params);
|
|
}
|
|
|
|
static struct nsim_fib4_rt *
|
|
nsim_fib4_rt_create(struct nsim_fib_data *data,
|
|
struct fib_entry_notifier_info *fen_info)
|
|
{
|
|
struct nsim_fib4_rt *fib4_rt;
|
|
|
|
fib4_rt = kzalloc(sizeof(*fib4_rt), GFP_KERNEL);
|
|
if (!fib4_rt)
|
|
return NULL;
|
|
|
|
nsim_fib_rt_init(data, &fib4_rt->common, &fen_info->dst, sizeof(u32),
|
|
fen_info->dst_len, AF_INET, fen_info->tb_id);
|
|
|
|
fib4_rt->fi = fen_info->fi;
|
|
fib_info_hold(fib4_rt->fi);
|
|
fib4_rt->tos = fen_info->tos;
|
|
fib4_rt->type = fen_info->type;
|
|
|
|
return fib4_rt;
|
|
}
|
|
|
|
static void nsim_fib4_rt_destroy(struct nsim_fib4_rt *fib4_rt)
|
|
{
|
|
fib_info_put(fib4_rt->fi);
|
|
nsim_fib_rt_fini(&fib4_rt->common);
|
|
kfree(fib4_rt);
|
|
}
|
|
|
|
static struct nsim_fib4_rt *
|
|
nsim_fib4_rt_lookup(struct rhashtable *fib_rt_ht,
|
|
const struct fib_entry_notifier_info *fen_info)
|
|
{
|
|
struct nsim_fib_rt *fib_rt;
|
|
|
|
fib_rt = nsim_fib_rt_lookup(fib_rt_ht, &fen_info->dst, sizeof(u32),
|
|
fen_info->dst_len, AF_INET,
|
|
fen_info->tb_id);
|
|
if (!fib_rt)
|
|
return NULL;
|
|
|
|
return container_of(fib_rt, struct nsim_fib4_rt, common);
|
|
}
|
|
|
|
static void
|
|
nsim_fib4_rt_offload_failed_flag_set(struct net *net,
|
|
struct fib_entry_notifier_info *fen_info)
|
|
{
|
|
u32 *p_dst = (u32 *)&fen_info->dst;
|
|
struct fib_rt_info fri;
|
|
|
|
fri.fi = fen_info->fi;
|
|
fri.tb_id = fen_info->tb_id;
|
|
fri.dst = cpu_to_be32(*p_dst);
|
|
fri.dst_len = fen_info->dst_len;
|
|
fri.tos = fen_info->tos;
|
|
fri.type = fen_info->type;
|
|
fri.offload = false;
|
|
fri.trap = false;
|
|
fri.offload_failed = true;
|
|
fib_alias_hw_flags_set(net, &fri);
|
|
}
|
|
|
|
static void nsim_fib4_rt_hw_flags_set(struct net *net,
|
|
const struct nsim_fib4_rt *fib4_rt,
|
|
bool trap)
|
|
{
|
|
u32 *p_dst = (u32 *) fib4_rt->common.key.addr;
|
|
int dst_len = fib4_rt->common.key.prefix_len;
|
|
struct fib_rt_info fri;
|
|
|
|
fri.fi = fib4_rt->fi;
|
|
fri.tb_id = fib4_rt->common.key.tb_id;
|
|
fri.dst = cpu_to_be32(*p_dst);
|
|
fri.dst_len = dst_len;
|
|
fri.tos = fib4_rt->tos;
|
|
fri.type = fib4_rt->type;
|
|
fri.offload = false;
|
|
fri.trap = trap;
|
|
fri.offload_failed = false;
|
|
fib_alias_hw_flags_set(net, &fri);
|
|
}
|
|
|
|
static int nsim_fib4_rt_add(struct nsim_fib_data *data,
|
|
struct nsim_fib4_rt *fib4_rt)
|
|
{
|
|
struct net *net = devlink_net(data->devlink);
|
|
int err;
|
|
|
|
err = rhashtable_insert_fast(&data->fib_rt_ht,
|
|
&fib4_rt->common.ht_node,
|
|
nsim_fib_rt_ht_params);
|
|
if (err)
|
|
goto err_fib_dismiss;
|
|
|
|
/* Simulate hardware programming latency. */
|
|
msleep(1);
|
|
nsim_fib4_rt_hw_flags_set(net, fib4_rt, true);
|
|
|
|
return 0;
|
|
|
|
err_fib_dismiss:
|
|
/* Drop the accounting that was increased from the notification
|
|
* context when FIB_EVENT_ENTRY_REPLACE was triggered.
|
|
*/
|
|
nsim_fib_account(&data->ipv4.fib, false);
|
|
return err;
|
|
}
|
|
|
|
static int nsim_fib4_rt_replace(struct nsim_fib_data *data,
|
|
struct nsim_fib4_rt *fib4_rt,
|
|
struct nsim_fib4_rt *fib4_rt_old)
|
|
{
|
|
struct net *net = devlink_net(data->devlink);
|
|
int err;
|
|
|
|
/* We are replacing a route, so need to remove the accounting which
|
|
* was increased when FIB_EVENT_ENTRY_REPLACE was triggered.
|
|
*/
|
|
err = nsim_fib_account(&data->ipv4.fib, false);
|
|
if (err)
|
|
return err;
|
|
err = rhashtable_replace_fast(&data->fib_rt_ht,
|
|
&fib4_rt_old->common.ht_node,
|
|
&fib4_rt->common.ht_node,
|
|
nsim_fib_rt_ht_params);
|
|
if (err)
|
|
return err;
|
|
|
|
msleep(1);
|
|
nsim_fib4_rt_hw_flags_set(net, fib4_rt, true);
|
|
|
|
nsim_fib4_rt_hw_flags_set(net, fib4_rt_old, false);
|
|
nsim_fib4_rt_destroy(fib4_rt_old);
|
|
|
|
return 0;
|
|
}
|
|
|
|
static int nsim_fib4_rt_insert(struct nsim_fib_data *data,
|
|
struct fib_entry_notifier_info *fen_info)
|
|
{
|
|
struct nsim_fib4_rt *fib4_rt, *fib4_rt_old;
|
|
int err;
|
|
|
|
if (data->fail_route_offload) {
|
|
/* For testing purposes, user set debugfs fail_route_offload
|
|
* value to true. Simulate hardware programming latency and then
|
|
* fail.
|
|
*/
|
|
msleep(1);
|
|
return -EINVAL;
|
|
}
|
|
|
|
fib4_rt = nsim_fib4_rt_create(data, fen_info);
|
|
if (!fib4_rt)
|
|
return -ENOMEM;
|
|
|
|
fib4_rt_old = nsim_fib4_rt_lookup(&data->fib_rt_ht, fen_info);
|
|
if (!fib4_rt_old)
|
|
err = nsim_fib4_rt_add(data, fib4_rt);
|
|
else
|
|
err = nsim_fib4_rt_replace(data, fib4_rt, fib4_rt_old);
|
|
|
|
if (err)
|
|
nsim_fib4_rt_destroy(fib4_rt);
|
|
|
|
return err;
|
|
}
|
|
|
|
static void nsim_fib4_rt_remove(struct nsim_fib_data *data,
|
|
const struct fib_entry_notifier_info *fen_info)
|
|
{
|
|
struct nsim_fib4_rt *fib4_rt;
|
|
|
|
fib4_rt = nsim_fib4_rt_lookup(&data->fib_rt_ht, fen_info);
|
|
if (!fib4_rt)
|
|
return;
|
|
|
|
rhashtable_remove_fast(&data->fib_rt_ht, &fib4_rt->common.ht_node,
|
|
nsim_fib_rt_ht_params);
|
|
nsim_fib4_rt_destroy(fib4_rt);
|
|
}
|
|
|
|
static int nsim_fib4_event(struct nsim_fib_data *data,
|
|
struct fib_entry_notifier_info *fen_info,
|
|
unsigned long event)
|
|
{
|
|
int err = 0;
|
|
|
|
switch (event) {
|
|
case FIB_EVENT_ENTRY_REPLACE:
|
|
err = nsim_fib4_rt_insert(data, fen_info);
|
|
if (err) {
|
|
struct net *net = devlink_net(data->devlink);
|
|
|
|
nsim_fib4_rt_offload_failed_flag_set(net, fen_info);
|
|
}
|
|
break;
|
|
case FIB_EVENT_ENTRY_DEL:
|
|
nsim_fib4_rt_remove(data, fen_info);
|
|
break;
|
|
default:
|
|
break;
|
|
}
|
|
|
|
return err;
|
|
}
|
|
|
|
static struct nsim_fib6_rt_nh *
|
|
nsim_fib6_rt_nh_find(const struct nsim_fib6_rt *fib6_rt,
|
|
const struct fib6_info *rt)
|
|
{
|
|
struct nsim_fib6_rt_nh *fib6_rt_nh;
|
|
|
|
list_for_each_entry(fib6_rt_nh, &fib6_rt->nh_list, list) {
|
|
if (fib6_rt_nh->rt == rt)
|
|
return fib6_rt_nh;
|
|
}
|
|
|
|
return NULL;
|
|
}
|
|
|
|
static int nsim_fib6_rt_nh_add(struct nsim_fib6_rt *fib6_rt,
|
|
struct fib6_info *rt)
|
|
{
|
|
struct nsim_fib6_rt_nh *fib6_rt_nh;
|
|
|
|
fib6_rt_nh = kzalloc(sizeof(*fib6_rt_nh), GFP_KERNEL);
|
|
if (!fib6_rt_nh)
|
|
return -ENOMEM;
|
|
|
|
fib6_info_hold(rt);
|
|
fib6_rt_nh->rt = rt;
|
|
list_add_tail(&fib6_rt_nh->list, &fib6_rt->nh_list);
|
|
fib6_rt->nhs++;
|
|
|
|
return 0;
|
|
}
|
|
|
|
#if IS_ENABLED(CONFIG_IPV6)
|
|
static void nsim_rt6_release(struct fib6_info *rt)
|
|
{
|
|
fib6_info_release(rt);
|
|
}
|
|
#else
|
|
static void nsim_rt6_release(struct fib6_info *rt)
|
|
{
|
|
}
|
|
#endif
|
|
|
|
static void nsim_fib6_rt_nh_del(struct nsim_fib6_rt *fib6_rt,
|
|
const struct fib6_info *rt)
|
|
{
|
|
struct nsim_fib6_rt_nh *fib6_rt_nh;
|
|
|
|
fib6_rt_nh = nsim_fib6_rt_nh_find(fib6_rt, rt);
|
|
if (!fib6_rt_nh)
|
|
return;
|
|
|
|
fib6_rt->nhs--;
|
|
list_del(&fib6_rt_nh->list);
|
|
nsim_rt6_release(fib6_rt_nh->rt);
|
|
kfree(fib6_rt_nh);
|
|
}
|
|
|
|
static struct nsim_fib6_rt *
|
|
nsim_fib6_rt_create(struct nsim_fib_data *data,
|
|
struct fib6_info **rt_arr, unsigned int nrt6)
|
|
{
|
|
struct fib6_info *rt = rt_arr[0];
|
|
struct nsim_fib6_rt *fib6_rt;
|
|
int i = 0;
|
|
int err;
|
|
|
|
fib6_rt = kzalloc(sizeof(*fib6_rt), GFP_KERNEL);
|
|
if (!fib6_rt)
|
|
return ERR_PTR(-ENOMEM);
|
|
|
|
nsim_fib_rt_init(data, &fib6_rt->common, &rt->fib6_dst.addr,
|
|
sizeof(rt->fib6_dst.addr), rt->fib6_dst.plen, AF_INET6,
|
|
rt->fib6_table->tb6_id);
|
|
|
|
/* We consider a multipath IPv6 route as one entry, but it can be made
|
|
* up from several fib6_info structs (one for each nexthop), so we
|
|
* add them all to the same list under the entry.
|
|
*/
|
|
INIT_LIST_HEAD(&fib6_rt->nh_list);
|
|
|
|
for (i = 0; i < nrt6; i++) {
|
|
err = nsim_fib6_rt_nh_add(fib6_rt, rt_arr[i]);
|
|
if (err)
|
|
goto err_fib6_rt_nh_del;
|
|
}
|
|
|
|
return fib6_rt;
|
|
|
|
err_fib6_rt_nh_del:
|
|
for (i--; i >= 0; i--) {
|
|
nsim_fib6_rt_nh_del(fib6_rt, rt_arr[i]);
|
|
};
|
|
nsim_fib_rt_fini(&fib6_rt->common);
|
|
kfree(fib6_rt);
|
|
return ERR_PTR(err);
|
|
}
|
|
|
|
static void nsim_fib6_rt_destroy(struct nsim_fib6_rt *fib6_rt)
|
|
{
|
|
struct nsim_fib6_rt_nh *iter, *tmp;
|
|
|
|
list_for_each_entry_safe(iter, tmp, &fib6_rt->nh_list, list)
|
|
nsim_fib6_rt_nh_del(fib6_rt, iter->rt);
|
|
WARN_ON_ONCE(!list_empty(&fib6_rt->nh_list));
|
|
nsim_fib_rt_fini(&fib6_rt->common);
|
|
kfree(fib6_rt);
|
|
}
|
|
|
|
static struct nsim_fib6_rt *
|
|
nsim_fib6_rt_lookup(struct rhashtable *fib_rt_ht, const struct fib6_info *rt)
|
|
{
|
|
struct nsim_fib_rt *fib_rt;
|
|
|
|
fib_rt = nsim_fib_rt_lookup(fib_rt_ht, &rt->fib6_dst.addr,
|
|
sizeof(rt->fib6_dst.addr),
|
|
rt->fib6_dst.plen, AF_INET6,
|
|
rt->fib6_table->tb6_id);
|
|
if (!fib_rt)
|
|
return NULL;
|
|
|
|
return container_of(fib_rt, struct nsim_fib6_rt, common);
|
|
}
|
|
|
|
static int nsim_fib6_rt_append(struct nsim_fib_data *data,
|
|
struct nsim_fib6_event *fib6_event)
|
|
{
|
|
struct fib6_info *rt = fib6_event->rt_arr[0];
|
|
struct nsim_fib6_rt *fib6_rt;
|
|
int i, err;
|
|
|
|
if (data->fail_route_offload) {
|
|
/* For testing purposes, user set debugfs fail_route_offload
|
|
* value to true. Simulate hardware programming latency and then
|
|
* fail.
|
|
*/
|
|
msleep(1);
|
|
return -EINVAL;
|
|
}
|
|
|
|
fib6_rt = nsim_fib6_rt_lookup(&data->fib_rt_ht, rt);
|
|
if (!fib6_rt)
|
|
return -EINVAL;
|
|
|
|
for (i = 0; i < fib6_event->nrt6; i++) {
|
|
err = nsim_fib6_rt_nh_add(fib6_rt, fib6_event->rt_arr[i]);
|
|
if (err)
|
|
goto err_fib6_rt_nh_del;
|
|
|
|
fib6_event->rt_arr[i]->trap = true;
|
|
}
|
|
|
|
return 0;
|
|
|
|
err_fib6_rt_nh_del:
|
|
for (i--; i >= 0; i--) {
|
|
fib6_event->rt_arr[i]->trap = false;
|
|
nsim_fib6_rt_nh_del(fib6_rt, fib6_event->rt_arr[i]);
|
|
}
|
|
return err;
|
|
}
|
|
|
|
#if IS_ENABLED(CONFIG_IPV6)
|
|
static void nsim_fib6_rt_offload_failed_flag_set(struct nsim_fib_data *data,
|
|
struct fib6_info **rt_arr,
|
|
unsigned int nrt6)
|
|
|
|
{
|
|
struct net *net = devlink_net(data->devlink);
|
|
int i;
|
|
|
|
for (i = 0; i < nrt6; i++)
|
|
fib6_info_hw_flags_set(net, rt_arr[i], false, false, true);
|
|
}
|
|
#else
|
|
static void nsim_fib6_rt_offload_failed_flag_set(struct nsim_fib_data *data,
|
|
struct fib6_info **rt_arr,
|
|
unsigned int nrt6)
|
|
{
|
|
}
|
|
#endif
|
|
|
|
#if IS_ENABLED(CONFIG_IPV6)
|
|
static void nsim_fib6_rt_hw_flags_set(struct nsim_fib_data *data,
|
|
const struct nsim_fib6_rt *fib6_rt,
|
|
bool trap)
|
|
{
|
|
struct net *net = devlink_net(data->devlink);
|
|
struct nsim_fib6_rt_nh *fib6_rt_nh;
|
|
|
|
list_for_each_entry(fib6_rt_nh, &fib6_rt->nh_list, list)
|
|
fib6_info_hw_flags_set(net, fib6_rt_nh->rt, false, trap, false);
|
|
}
|
|
#else
|
|
static void nsim_fib6_rt_hw_flags_set(struct nsim_fib_data *data,
|
|
const struct nsim_fib6_rt *fib6_rt,
|
|
bool trap)
|
|
{
|
|
}
|
|
#endif
|
|
|
|
static int nsim_fib6_rt_add(struct nsim_fib_data *data,
|
|
struct nsim_fib6_rt *fib6_rt)
|
|
{
|
|
int err;
|
|
|
|
err = rhashtable_insert_fast(&data->fib_rt_ht,
|
|
&fib6_rt->common.ht_node,
|
|
nsim_fib_rt_ht_params);
|
|
|
|
if (err)
|
|
goto err_fib_dismiss;
|
|
|
|
msleep(1);
|
|
nsim_fib6_rt_hw_flags_set(data, fib6_rt, true);
|
|
|
|
return 0;
|
|
|
|
err_fib_dismiss:
|
|
/* Drop the accounting that was increased from the notification
|
|
* context when FIB_EVENT_ENTRY_REPLACE was triggered.
|
|
*/
|
|
nsim_fib_account(&data->ipv6.fib, false);
|
|
return err;
|
|
}
|
|
|
|
static int nsim_fib6_rt_replace(struct nsim_fib_data *data,
|
|
struct nsim_fib6_rt *fib6_rt,
|
|
struct nsim_fib6_rt *fib6_rt_old)
|
|
{
|
|
int err;
|
|
|
|
/* We are replacing a route, so need to remove the accounting which
|
|
* was increased when FIB_EVENT_ENTRY_REPLACE was triggered.
|
|
*/
|
|
err = nsim_fib_account(&data->ipv6.fib, false);
|
|
if (err)
|
|
return err;
|
|
|
|
err = rhashtable_replace_fast(&data->fib_rt_ht,
|
|
&fib6_rt_old->common.ht_node,
|
|
&fib6_rt->common.ht_node,
|
|
nsim_fib_rt_ht_params);
|
|
|
|
if (err)
|
|
return err;
|
|
|
|
msleep(1);
|
|
nsim_fib6_rt_hw_flags_set(data, fib6_rt, true);
|
|
|
|
nsim_fib6_rt_hw_flags_set(data, fib6_rt_old, false);
|
|
nsim_fib6_rt_destroy(fib6_rt_old);
|
|
|
|
return 0;
|
|
}
|
|
|
|
static int nsim_fib6_rt_insert(struct nsim_fib_data *data,
|
|
struct nsim_fib6_event *fib6_event)
|
|
{
|
|
struct fib6_info *rt = fib6_event->rt_arr[0];
|
|
struct nsim_fib6_rt *fib6_rt, *fib6_rt_old;
|
|
int err;
|
|
|
|
if (data->fail_route_offload) {
|
|
/* For testing purposes, user set debugfs fail_route_offload
|
|
* value to true. Simulate hardware programming latency and then
|
|
* fail.
|
|
*/
|
|
msleep(1);
|
|
return -EINVAL;
|
|
}
|
|
|
|
fib6_rt = nsim_fib6_rt_create(data, fib6_event->rt_arr,
|
|
fib6_event->nrt6);
|
|
if (IS_ERR(fib6_rt))
|
|
return PTR_ERR(fib6_rt);
|
|
|
|
fib6_rt_old = nsim_fib6_rt_lookup(&data->fib_rt_ht, rt);
|
|
if (!fib6_rt_old)
|
|
err = nsim_fib6_rt_add(data, fib6_rt);
|
|
else
|
|
err = nsim_fib6_rt_replace(data, fib6_rt, fib6_rt_old);
|
|
|
|
if (err)
|
|
nsim_fib6_rt_destroy(fib6_rt);
|
|
|
|
return err;
|
|
}
|
|
|
|
static void nsim_fib6_rt_remove(struct nsim_fib_data *data,
|
|
struct nsim_fib6_event *fib6_event)
|
|
{
|
|
struct fib6_info *rt = fib6_event->rt_arr[0];
|
|
struct nsim_fib6_rt *fib6_rt;
|
|
int i;
|
|
|
|
/* Multipath routes are first added to the FIB trie and only then
|
|
* notified. If we vetoed the addition, we will get a delete
|
|
* notification for a route we do not have. Therefore, do not warn if
|
|
* route was not found.
|
|
*/
|
|
fib6_rt = nsim_fib6_rt_lookup(&data->fib_rt_ht, rt);
|
|
if (!fib6_rt)
|
|
return;
|
|
|
|
/* If not all the nexthops are deleted, then only reduce the nexthop
|
|
* group.
|
|
*/
|
|
if (fib6_event->nrt6 != fib6_rt->nhs) {
|
|
for (i = 0; i < fib6_event->nrt6; i++)
|
|
nsim_fib6_rt_nh_del(fib6_rt, fib6_event->rt_arr[i]);
|
|
return;
|
|
}
|
|
|
|
rhashtable_remove_fast(&data->fib_rt_ht, &fib6_rt->common.ht_node,
|
|
nsim_fib_rt_ht_params);
|
|
nsim_fib6_rt_destroy(fib6_rt);
|
|
}
|
|
|
|
static int nsim_fib6_event_init(struct nsim_fib6_event *fib6_event,
|
|
struct fib6_entry_notifier_info *fen6_info)
|
|
{
|
|
struct fib6_info *rt = fen6_info->rt;
|
|
struct fib6_info **rt_arr;
|
|
struct fib6_info *iter;
|
|
unsigned int nrt6;
|
|
int i = 0;
|
|
|
|
nrt6 = fen6_info->nsiblings + 1;
|
|
|
|
rt_arr = kcalloc(nrt6, sizeof(struct fib6_info *), GFP_ATOMIC);
|
|
if (!rt_arr)
|
|
return -ENOMEM;
|
|
|
|
fib6_event->rt_arr = rt_arr;
|
|
fib6_event->nrt6 = nrt6;
|
|
|
|
rt_arr[0] = rt;
|
|
fib6_info_hold(rt);
|
|
|
|
if (!fen6_info->nsiblings)
|
|
return 0;
|
|
|
|
list_for_each_entry(iter, &rt->fib6_siblings, fib6_siblings) {
|
|
if (i == fen6_info->nsiblings)
|
|
break;
|
|
|
|
rt_arr[i + 1] = iter;
|
|
fib6_info_hold(iter);
|
|
i++;
|
|
}
|
|
WARN_ON_ONCE(i != fen6_info->nsiblings);
|
|
|
|
return 0;
|
|
}
|
|
|
|
static void nsim_fib6_event_fini(struct nsim_fib6_event *fib6_event)
|
|
{
|
|
int i;
|
|
|
|
for (i = 0; i < fib6_event->nrt6; i++)
|
|
nsim_rt6_release(fib6_event->rt_arr[i]);
|
|
kfree(fib6_event->rt_arr);
|
|
}
|
|
|
|
static int nsim_fib6_event(struct nsim_fib_data *data,
|
|
struct nsim_fib6_event *fib6_event,
|
|
unsigned long event)
|
|
{
|
|
int err;
|
|
|
|
if (fib6_event->rt_arr[0]->fib6_src.plen)
|
|
return 0;
|
|
|
|
switch (event) {
|
|
case FIB_EVENT_ENTRY_REPLACE:
|
|
err = nsim_fib6_rt_insert(data, fib6_event);
|
|
if (err)
|
|
goto err_rt_offload_failed_flag_set;
|
|
break;
|
|
case FIB_EVENT_ENTRY_APPEND:
|
|
err = nsim_fib6_rt_append(data, fib6_event);
|
|
if (err)
|
|
goto err_rt_offload_failed_flag_set;
|
|
break;
|
|
case FIB_EVENT_ENTRY_DEL:
|
|
nsim_fib6_rt_remove(data, fib6_event);
|
|
break;
|
|
default:
|
|
break;
|
|
}
|
|
|
|
return 0;
|
|
|
|
err_rt_offload_failed_flag_set:
|
|
nsim_fib6_rt_offload_failed_flag_set(data, fib6_event->rt_arr,
|
|
fib6_event->nrt6);
|
|
return err;
|
|
}
|
|
|
|
static void nsim_fib_event(struct nsim_fib_event *fib_event)
|
|
{
|
|
switch (fib_event->family) {
|
|
case AF_INET:
|
|
nsim_fib4_event(fib_event->data, &fib_event->fen_info,
|
|
fib_event->event);
|
|
fib_info_put(fib_event->fen_info.fi);
|
|
break;
|
|
case AF_INET6:
|
|
nsim_fib6_event(fib_event->data, &fib_event->fib6_event,
|
|
fib_event->event);
|
|
nsim_fib6_event_fini(&fib_event->fib6_event);
|
|
break;
|
|
}
|
|
}
|
|
|
|
static int nsim_fib4_prepare_event(struct fib_notifier_info *info,
|
|
struct nsim_fib_event *fib_event,
|
|
unsigned long event)
|
|
{
|
|
struct nsim_fib_data *data = fib_event->data;
|
|
struct fib_entry_notifier_info *fen_info;
|
|
struct netlink_ext_ack *extack;
|
|
int err = 0;
|
|
|
|
fen_info = container_of(info, struct fib_entry_notifier_info,
|
|
info);
|
|
fib_event->fen_info = *fen_info;
|
|
extack = info->extack;
|
|
|
|
switch (event) {
|
|
case FIB_EVENT_ENTRY_REPLACE:
|
|
err = nsim_fib_account(&data->ipv4.fib, true);
|
|
if (err) {
|
|
NL_SET_ERR_MSG_MOD(extack, "Exceeded number of supported fib entries");
|
|
return err;
|
|
}
|
|
break;
|
|
case FIB_EVENT_ENTRY_DEL:
|
|
nsim_fib_account(&data->ipv4.fib, false);
|
|
break;
|
|
}
|
|
|
|
/* Take reference on fib_info to prevent it from being
|
|
* freed while event is queued. Release it afterwards.
|
|
*/
|
|
fib_info_hold(fib_event->fen_info.fi);
|
|
|
|
return 0;
|
|
}
|
|
|
|
static int nsim_fib6_prepare_event(struct fib_notifier_info *info,
|
|
struct nsim_fib_event *fib_event,
|
|
unsigned long event)
|
|
{
|
|
struct nsim_fib_data *data = fib_event->data;
|
|
struct fib6_entry_notifier_info *fen6_info;
|
|
struct netlink_ext_ack *extack;
|
|
int err = 0;
|
|
|
|
fen6_info = container_of(info, struct fib6_entry_notifier_info,
|
|
info);
|
|
|
|
err = nsim_fib6_event_init(&fib_event->fib6_event, fen6_info);
|
|
if (err)
|
|
return err;
|
|
|
|
extack = info->extack;
|
|
switch (event) {
|
|
case FIB_EVENT_ENTRY_REPLACE:
|
|
err = nsim_fib_account(&data->ipv6.fib, true);
|
|
if (err) {
|
|
NL_SET_ERR_MSG_MOD(extack, "Exceeded number of supported fib entries");
|
|
goto err_fib6_event_fini;
|
|
}
|
|
break;
|
|
case FIB_EVENT_ENTRY_DEL:
|
|
nsim_fib_account(&data->ipv6.fib, false);
|
|
break;
|
|
}
|
|
|
|
return 0;
|
|
|
|
err_fib6_event_fini:
|
|
nsim_fib6_event_fini(&fib_event->fib6_event);
|
|
return err;
|
|
}
|
|
|
|
static int nsim_fib_event_schedule_work(struct nsim_fib_data *data,
|
|
struct fib_notifier_info *info,
|
|
unsigned long event)
|
|
{
|
|
struct nsim_fib_event *fib_event;
|
|
int err;
|
|
|
|
if (info->family != AF_INET && info->family != AF_INET6)
|
|
/* netdevsim does not support 'RTNL_FAMILY_IP6MR' and
|
|
* 'RTNL_FAMILY_IPMR' and should ignore them.
|
|
*/
|
|
return NOTIFY_DONE;
|
|
|
|
fib_event = kzalloc(sizeof(*fib_event), GFP_ATOMIC);
|
|
if (!fib_event)
|
|
return NOTIFY_BAD;
|
|
|
|
fib_event->data = data;
|
|
fib_event->event = event;
|
|
fib_event->family = info->family;
|
|
|
|
switch (info->family) {
|
|
case AF_INET:
|
|
err = nsim_fib4_prepare_event(info, fib_event, event);
|
|
break;
|
|
case AF_INET6:
|
|
err = nsim_fib6_prepare_event(info, fib_event, event);
|
|
break;
|
|
}
|
|
|
|
if (err)
|
|
goto err_fib_prepare_event;
|
|
|
|
/* Enqueue the event and trigger the work */
|
|
spin_lock_bh(&data->fib_event_queue_lock);
|
|
list_add_tail(&fib_event->list, &data->fib_event_queue);
|
|
spin_unlock_bh(&data->fib_event_queue_lock);
|
|
schedule_work(&data->fib_event_work);
|
|
|
|
return NOTIFY_DONE;
|
|
|
|
err_fib_prepare_event:
|
|
kfree(fib_event);
|
|
return NOTIFY_BAD;
|
|
}
|
|
|
|
static int nsim_fib_event_nb(struct notifier_block *nb, unsigned long event,
|
|
void *ptr)
|
|
{
|
|
struct nsim_fib_data *data = container_of(nb, struct nsim_fib_data,
|
|
fib_nb);
|
|
struct fib_notifier_info *info = ptr;
|
|
int err;
|
|
|
|
switch (event) {
|
|
case FIB_EVENT_RULE_ADD:
|
|
case FIB_EVENT_RULE_DEL:
|
|
err = nsim_fib_rule_event(data, info,
|
|
event == FIB_EVENT_RULE_ADD);
|
|
return notifier_from_errno(err);
|
|
case FIB_EVENT_ENTRY_REPLACE:
|
|
case FIB_EVENT_ENTRY_APPEND:
|
|
case FIB_EVENT_ENTRY_DEL:
|
|
return nsim_fib_event_schedule_work(data, info, event);
|
|
}
|
|
|
|
return NOTIFY_DONE;
|
|
}
|
|
|
|
static void nsim_fib4_rt_free(struct nsim_fib_rt *fib_rt,
|
|
struct nsim_fib_data *data)
|
|
{
|
|
struct devlink *devlink = data->devlink;
|
|
struct nsim_fib4_rt *fib4_rt;
|
|
|
|
fib4_rt = container_of(fib_rt, struct nsim_fib4_rt, common);
|
|
nsim_fib4_rt_hw_flags_set(devlink_net(devlink), fib4_rt, false);
|
|
nsim_fib_account(&data->ipv4.fib, false);
|
|
nsim_fib4_rt_destroy(fib4_rt);
|
|
}
|
|
|
|
static void nsim_fib6_rt_free(struct nsim_fib_rt *fib_rt,
|
|
struct nsim_fib_data *data)
|
|
{
|
|
struct nsim_fib6_rt *fib6_rt;
|
|
|
|
fib6_rt = container_of(fib_rt, struct nsim_fib6_rt, common);
|
|
nsim_fib6_rt_hw_flags_set(data, fib6_rt, false);
|
|
nsim_fib_account(&data->ipv6.fib, false);
|
|
nsim_fib6_rt_destroy(fib6_rt);
|
|
}
|
|
|
|
static void nsim_fib_rt_free(void *ptr, void *arg)
|
|
{
|
|
struct nsim_fib_rt *fib_rt = ptr;
|
|
struct nsim_fib_data *data = arg;
|
|
|
|
switch (fib_rt->key.family) {
|
|
case AF_INET:
|
|
nsim_fib4_rt_free(fib_rt, data);
|
|
break;
|
|
case AF_INET6:
|
|
nsim_fib6_rt_free(fib_rt, data);
|
|
break;
|
|
default:
|
|
WARN_ON_ONCE(1);
|
|
}
|
|
}
|
|
|
|
/* inconsistent dump, trying again */
|
|
static void nsim_fib_dump_inconsistent(struct notifier_block *nb)
|
|
{
|
|
struct nsim_fib_data *data = container_of(nb, struct nsim_fib_data,
|
|
fib_nb);
|
|
struct nsim_fib_rt *fib_rt, *fib_rt_tmp;
|
|
|
|
/* Flush the work to make sure there is no race with notifications. */
|
|
flush_work(&data->fib_event_work);
|
|
|
|
/* The notifier block is still not registered, so we do not need to
|
|
* take any locks here.
|
|
*/
|
|
list_for_each_entry_safe(fib_rt, fib_rt_tmp, &data->fib_rt_list, list) {
|
|
rhashtable_remove_fast(&data->fib_rt_ht, &fib_rt->ht_node,
|
|
nsim_fib_rt_ht_params);
|
|
nsim_fib_rt_free(fib_rt, data);
|
|
}
|
|
|
|
atomic64_set(&data->ipv4.rules.num, 0ULL);
|
|
atomic64_set(&data->ipv6.rules.num, 0ULL);
|
|
}
|
|
|
|
static struct nsim_nexthop *nsim_nexthop_create(struct nsim_fib_data *data,
|
|
struct nh_notifier_info *info)
|
|
{
|
|
struct nsim_nexthop *nexthop;
|
|
u64 occ = 0;
|
|
int i;
|
|
|
|
nexthop = kzalloc(sizeof(*nexthop), GFP_KERNEL);
|
|
if (!nexthop)
|
|
return ERR_PTR(-ENOMEM);
|
|
|
|
nexthop->id = info->id;
|
|
|
|
/* Determine the number of nexthop entries the new nexthop will
|
|
* occupy.
|
|
*/
|
|
|
|
switch (info->type) {
|
|
case NH_NOTIFIER_INFO_TYPE_SINGLE:
|
|
occ = 1;
|
|
break;
|
|
case NH_NOTIFIER_INFO_TYPE_GRP:
|
|
for (i = 0; i < info->nh_grp->num_nh; i++)
|
|
occ += info->nh_grp->nh_entries[i].weight;
|
|
break;
|
|
case NH_NOTIFIER_INFO_TYPE_RES_TABLE:
|
|
occ = info->nh_res_table->num_nh_buckets;
|
|
nexthop->is_resilient = true;
|
|
break;
|
|
default:
|
|
NL_SET_ERR_MSG_MOD(info->extack, "Unsupported nexthop type");
|
|
kfree(nexthop);
|
|
return ERR_PTR(-EOPNOTSUPP);
|
|
}
|
|
|
|
nexthop->occ = occ;
|
|
return nexthop;
|
|
}
|
|
|
|
static void nsim_nexthop_destroy(struct nsim_nexthop *nexthop)
|
|
{
|
|
kfree(nexthop);
|
|
}
|
|
|
|
static int nsim_nexthop_account(struct nsim_fib_data *data, u64 occ,
|
|
bool add, struct netlink_ext_ack *extack)
|
|
{
|
|
int i, err = 0;
|
|
|
|
if (add) {
|
|
for (i = 0; i < occ; i++)
|
|
if (!atomic64_add_unless(&data->nexthops.num, 1,
|
|
data->nexthops.max)) {
|
|
err = -ENOSPC;
|
|
NL_SET_ERR_MSG_MOD(extack, "Exceeded number of supported nexthops");
|
|
goto err_num_decrease;
|
|
}
|
|
} else {
|
|
if (WARN_ON(occ > atomic64_read(&data->nexthops.num)))
|
|
return -EINVAL;
|
|
atomic64_sub(occ, &data->nexthops.num);
|
|
}
|
|
|
|
return err;
|
|
|
|
err_num_decrease:
|
|
atomic64_sub(i, &data->nexthops.num);
|
|
return err;
|
|
|
|
}
|
|
|
|
static void nsim_nexthop_hw_flags_set(struct net *net,
|
|
const struct nsim_nexthop *nexthop,
|
|
bool trap)
|
|
{
|
|
int i;
|
|
|
|
nexthop_set_hw_flags(net, nexthop->id, false, trap);
|
|
|
|
if (!nexthop->is_resilient)
|
|
return;
|
|
|
|
for (i = 0; i < nexthop->occ; i++)
|
|
nexthop_bucket_set_hw_flags(net, nexthop->id, i, false, trap);
|
|
}
|
|
|
|
static int nsim_nexthop_add(struct nsim_fib_data *data,
|
|
struct nsim_nexthop *nexthop,
|
|
struct netlink_ext_ack *extack)
|
|
{
|
|
struct net *net = devlink_net(data->devlink);
|
|
int err;
|
|
|
|
err = nsim_nexthop_account(data, nexthop->occ, true, extack);
|
|
if (err)
|
|
return err;
|
|
|
|
err = rhashtable_insert_fast(&data->nexthop_ht, &nexthop->ht_node,
|
|
nsim_nexthop_ht_params);
|
|
if (err) {
|
|
NL_SET_ERR_MSG_MOD(extack, "Failed to insert nexthop");
|
|
goto err_nexthop_dismiss;
|
|
}
|
|
|
|
nsim_nexthop_hw_flags_set(net, nexthop, true);
|
|
|
|
return 0;
|
|
|
|
err_nexthop_dismiss:
|
|
nsim_nexthop_account(data, nexthop->occ, false, extack);
|
|
return err;
|
|
}
|
|
|
|
static int nsim_nexthop_replace(struct nsim_fib_data *data,
|
|
struct nsim_nexthop *nexthop,
|
|
struct nsim_nexthop *nexthop_old,
|
|
struct netlink_ext_ack *extack)
|
|
{
|
|
struct net *net = devlink_net(data->devlink);
|
|
int err;
|
|
|
|
err = nsim_nexthop_account(data, nexthop->occ, true, extack);
|
|
if (err)
|
|
return err;
|
|
|
|
err = rhashtable_replace_fast(&data->nexthop_ht,
|
|
&nexthop_old->ht_node, &nexthop->ht_node,
|
|
nsim_nexthop_ht_params);
|
|
if (err) {
|
|
NL_SET_ERR_MSG_MOD(extack, "Failed to replace nexthop");
|
|
goto err_nexthop_dismiss;
|
|
}
|
|
|
|
nsim_nexthop_hw_flags_set(net, nexthop, true);
|
|
nsim_nexthop_account(data, nexthop_old->occ, false, extack);
|
|
nsim_nexthop_destroy(nexthop_old);
|
|
|
|
return 0;
|
|
|
|
err_nexthop_dismiss:
|
|
nsim_nexthop_account(data, nexthop->occ, false, extack);
|
|
return err;
|
|
}
|
|
|
|
static int nsim_nexthop_insert(struct nsim_fib_data *data,
|
|
struct nh_notifier_info *info)
|
|
{
|
|
struct nsim_nexthop *nexthop, *nexthop_old;
|
|
int err;
|
|
|
|
nexthop = nsim_nexthop_create(data, info);
|
|
if (IS_ERR(nexthop))
|
|
return PTR_ERR(nexthop);
|
|
|
|
nexthop_old = rhashtable_lookup_fast(&data->nexthop_ht, &info->id,
|
|
nsim_nexthop_ht_params);
|
|
if (!nexthop_old)
|
|
err = nsim_nexthop_add(data, nexthop, info->extack);
|
|
else
|
|
err = nsim_nexthop_replace(data, nexthop, nexthop_old,
|
|
info->extack);
|
|
|
|
if (err)
|
|
nsim_nexthop_destroy(nexthop);
|
|
|
|
return err;
|
|
}
|
|
|
|
static void nsim_nexthop_remove(struct nsim_fib_data *data,
|
|
struct nh_notifier_info *info)
|
|
{
|
|
struct nsim_nexthop *nexthop;
|
|
|
|
nexthop = rhashtable_lookup_fast(&data->nexthop_ht, &info->id,
|
|
nsim_nexthop_ht_params);
|
|
if (!nexthop)
|
|
return;
|
|
|
|
rhashtable_remove_fast(&data->nexthop_ht, &nexthop->ht_node,
|
|
nsim_nexthop_ht_params);
|
|
nsim_nexthop_account(data, nexthop->occ, false, info->extack);
|
|
nsim_nexthop_destroy(nexthop);
|
|
}
|
|
|
|
static int nsim_nexthop_res_table_pre_replace(struct nsim_fib_data *data,
|
|
struct nh_notifier_info *info)
|
|
{
|
|
if (data->fail_res_nexthop_group_replace) {
|
|
NL_SET_ERR_MSG_MOD(info->extack, "Failed to replace a resilient nexthop group");
|
|
return -EINVAL;
|
|
}
|
|
|
|
return 0;
|
|
}
|
|
|
|
static int nsim_nexthop_bucket_replace(struct nsim_fib_data *data,
|
|
struct nh_notifier_info *info)
|
|
{
|
|
if (data->fail_nexthop_bucket_replace) {
|
|
NL_SET_ERR_MSG_MOD(info->extack, "Failed to replace nexthop bucket");
|
|
return -EINVAL;
|
|
}
|
|
|
|
nexthop_bucket_set_hw_flags(info->net, info->id,
|
|
info->nh_res_bucket->bucket_index,
|
|
false, true);
|
|
|
|
return 0;
|
|
}
|
|
|
|
static int nsim_nexthop_event_nb(struct notifier_block *nb, unsigned long event,
|
|
void *ptr)
|
|
{
|
|
struct nsim_fib_data *data = container_of(nb, struct nsim_fib_data,
|
|
nexthop_nb);
|
|
struct nh_notifier_info *info = ptr;
|
|
int err = 0;
|
|
|
|
mutex_lock(&data->nh_lock);
|
|
switch (event) {
|
|
case NEXTHOP_EVENT_REPLACE:
|
|
err = nsim_nexthop_insert(data, info);
|
|
break;
|
|
case NEXTHOP_EVENT_DEL:
|
|
nsim_nexthop_remove(data, info);
|
|
break;
|
|
case NEXTHOP_EVENT_RES_TABLE_PRE_REPLACE:
|
|
err = nsim_nexthop_res_table_pre_replace(data, info);
|
|
break;
|
|
case NEXTHOP_EVENT_BUCKET_REPLACE:
|
|
err = nsim_nexthop_bucket_replace(data, info);
|
|
break;
|
|
default:
|
|
break;
|
|
}
|
|
|
|
mutex_unlock(&data->nh_lock);
|
|
return notifier_from_errno(err);
|
|
}
|
|
|
|
static void nsim_nexthop_free(void *ptr, void *arg)
|
|
{
|
|
struct nsim_nexthop *nexthop = ptr;
|
|
struct nsim_fib_data *data = arg;
|
|
struct net *net;
|
|
|
|
net = devlink_net(data->devlink);
|
|
nsim_nexthop_hw_flags_set(net, nexthop, false);
|
|
nsim_nexthop_account(data, nexthop->occ, false, NULL);
|
|
nsim_nexthop_destroy(nexthop);
|
|
}
|
|
|
|
static ssize_t nsim_nexthop_bucket_activity_write(struct file *file,
|
|
const char __user *user_buf,
|
|
size_t size, loff_t *ppos)
|
|
{
|
|
struct nsim_fib_data *data = file->private_data;
|
|
struct net *net = devlink_net(data->devlink);
|
|
struct nsim_nexthop *nexthop;
|
|
unsigned long *activity;
|
|
loff_t pos = *ppos;
|
|
u16 bucket_index;
|
|
char buf[128];
|
|
int err = 0;
|
|
u32 nhid;
|
|
|
|
if (pos != 0)
|
|
return -EINVAL;
|
|
if (size > sizeof(buf))
|
|
return -EINVAL;
|
|
if (copy_from_user(buf, user_buf, size))
|
|
return -EFAULT;
|
|
if (sscanf(buf, "%u %hu", &nhid, &bucket_index) != 2)
|
|
return -EINVAL;
|
|
|
|
rtnl_lock();
|
|
|
|
nexthop = rhashtable_lookup_fast(&data->nexthop_ht, &nhid,
|
|
nsim_nexthop_ht_params);
|
|
if (!nexthop || !nexthop->is_resilient ||
|
|
bucket_index >= nexthop->occ) {
|
|
err = -EINVAL;
|
|
goto out;
|
|
}
|
|
|
|
activity = bitmap_zalloc(nexthop->occ, GFP_KERNEL);
|
|
if (!activity) {
|
|
err = -ENOMEM;
|
|
goto out;
|
|
}
|
|
|
|
bitmap_set(activity, bucket_index, 1);
|
|
nexthop_res_grp_activity_update(net, nhid, nexthop->occ, activity);
|
|
bitmap_free(activity);
|
|
|
|
out:
|
|
rtnl_unlock();
|
|
|
|
*ppos = size;
|
|
return err ?: size;
|
|
}
|
|
|
|
static const struct file_operations nsim_nexthop_bucket_activity_fops = {
|
|
.open = simple_open,
|
|
.write = nsim_nexthop_bucket_activity_write,
|
|
.llseek = no_llseek,
|
|
.owner = THIS_MODULE,
|
|
};
|
|
|
|
static u64 nsim_fib_ipv4_resource_occ_get(void *priv)
|
|
{
|
|
struct nsim_fib_data *data = priv;
|
|
|
|
return nsim_fib_get_val(data, NSIM_RESOURCE_IPV4_FIB, false);
|
|
}
|
|
|
|
static u64 nsim_fib_ipv4_rules_res_occ_get(void *priv)
|
|
{
|
|
struct nsim_fib_data *data = priv;
|
|
|
|
return nsim_fib_get_val(data, NSIM_RESOURCE_IPV4_FIB_RULES, false);
|
|
}
|
|
|
|
static u64 nsim_fib_ipv6_resource_occ_get(void *priv)
|
|
{
|
|
struct nsim_fib_data *data = priv;
|
|
|
|
return nsim_fib_get_val(data, NSIM_RESOURCE_IPV6_FIB, false);
|
|
}
|
|
|
|
static u64 nsim_fib_ipv6_rules_res_occ_get(void *priv)
|
|
{
|
|
struct nsim_fib_data *data = priv;
|
|
|
|
return nsim_fib_get_val(data, NSIM_RESOURCE_IPV6_FIB_RULES, false);
|
|
}
|
|
|
|
static u64 nsim_fib_nexthops_res_occ_get(void *priv)
|
|
{
|
|
struct nsim_fib_data *data = priv;
|
|
|
|
return nsim_fib_get_val(data, NSIM_RESOURCE_NEXTHOPS, false);
|
|
}
|
|
|
|
static void nsim_fib_set_max_all(struct nsim_fib_data *data,
|
|
struct devlink *devlink)
|
|
{
|
|
enum nsim_resource_id res_ids[] = {
|
|
NSIM_RESOURCE_IPV4_FIB, NSIM_RESOURCE_IPV4_FIB_RULES,
|
|
NSIM_RESOURCE_IPV6_FIB, NSIM_RESOURCE_IPV6_FIB_RULES,
|
|
NSIM_RESOURCE_NEXTHOPS,
|
|
};
|
|
int i;
|
|
|
|
for (i = 0; i < ARRAY_SIZE(res_ids); i++) {
|
|
int err;
|
|
u64 val;
|
|
|
|
err = devlink_resource_size_get(devlink, res_ids[i], &val);
|
|
if (err)
|
|
val = (u64) -1;
|
|
nsim_fib_set_max(data, res_ids[i], val);
|
|
}
|
|
}
|
|
|
|
static void nsim_fib_event_work(struct work_struct *work)
|
|
{
|
|
struct nsim_fib_data *data = container_of(work, struct nsim_fib_data,
|
|
fib_event_work);
|
|
struct nsim_fib_event *fib_event, *next_fib_event;
|
|
|
|
LIST_HEAD(fib_event_queue);
|
|
|
|
spin_lock_bh(&data->fib_event_queue_lock);
|
|
list_splice_init(&data->fib_event_queue, &fib_event_queue);
|
|
spin_unlock_bh(&data->fib_event_queue_lock);
|
|
|
|
mutex_lock(&data->fib_lock);
|
|
list_for_each_entry_safe(fib_event, next_fib_event, &fib_event_queue,
|
|
list) {
|
|
nsim_fib_event(fib_event);
|
|
list_del(&fib_event->list);
|
|
kfree(fib_event);
|
|
cond_resched();
|
|
}
|
|
mutex_unlock(&data->fib_lock);
|
|
}
|
|
|
|
static int
|
|
nsim_fib_debugfs_init(struct nsim_fib_data *data, struct nsim_dev *nsim_dev)
|
|
{
|
|
data->ddir = debugfs_create_dir("fib", nsim_dev->ddir);
|
|
if (IS_ERR(data->ddir))
|
|
return PTR_ERR(data->ddir);
|
|
|
|
data->fail_route_offload = false;
|
|
debugfs_create_bool("fail_route_offload", 0600, data->ddir,
|
|
&data->fail_route_offload);
|
|
|
|
data->fail_res_nexthop_group_replace = false;
|
|
debugfs_create_bool("fail_res_nexthop_group_replace", 0600, data->ddir,
|
|
&data->fail_res_nexthop_group_replace);
|
|
|
|
data->fail_nexthop_bucket_replace = false;
|
|
debugfs_create_bool("fail_nexthop_bucket_replace", 0600, data->ddir,
|
|
&data->fail_nexthop_bucket_replace);
|
|
|
|
debugfs_create_file("nexthop_bucket_activity", 0200, data->ddir,
|
|
data, &nsim_nexthop_bucket_activity_fops);
|
|
return 0;
|
|
}
|
|
|
|
static void nsim_fib_debugfs_exit(struct nsim_fib_data *data)
|
|
{
|
|
debugfs_remove_recursive(data->ddir);
|
|
}
|
|
|
|
struct nsim_fib_data *nsim_fib_create(struct devlink *devlink,
|
|
struct netlink_ext_ack *extack)
|
|
{
|
|
struct nsim_fib_data *data;
|
|
struct nsim_dev *nsim_dev;
|
|
int err;
|
|
|
|
data = kzalloc(sizeof(*data), GFP_KERNEL);
|
|
if (!data)
|
|
return ERR_PTR(-ENOMEM);
|
|
data->devlink = devlink;
|
|
|
|
nsim_dev = devlink_priv(devlink);
|
|
err = nsim_fib_debugfs_init(data, nsim_dev);
|
|
if (err)
|
|
goto err_data_free;
|
|
|
|
mutex_init(&data->nh_lock);
|
|
err = rhashtable_init(&data->nexthop_ht, &nsim_nexthop_ht_params);
|
|
if (err)
|
|
goto err_debugfs_exit;
|
|
|
|
mutex_init(&data->fib_lock);
|
|
INIT_LIST_HEAD(&data->fib_rt_list);
|
|
err = rhashtable_init(&data->fib_rt_ht, &nsim_fib_rt_ht_params);
|
|
if (err)
|
|
goto err_rhashtable_nexthop_destroy;
|
|
|
|
INIT_WORK(&data->fib_event_work, nsim_fib_event_work);
|
|
INIT_LIST_HEAD(&data->fib_event_queue);
|
|
spin_lock_init(&data->fib_event_queue_lock);
|
|
|
|
nsim_fib_set_max_all(data, devlink);
|
|
|
|
data->nexthop_nb.notifier_call = nsim_nexthop_event_nb;
|
|
err = register_nexthop_notifier(devlink_net(devlink), &data->nexthop_nb,
|
|
extack);
|
|
if (err) {
|
|
pr_err("Failed to register nexthop notifier\n");
|
|
goto err_rhashtable_fib_destroy;
|
|
}
|
|
|
|
data->fib_nb.notifier_call = nsim_fib_event_nb;
|
|
err = register_fib_notifier(devlink_net(devlink), &data->fib_nb,
|
|
nsim_fib_dump_inconsistent, extack);
|
|
if (err) {
|
|
pr_err("Failed to register fib notifier\n");
|
|
goto err_nexthop_nb_unregister;
|
|
}
|
|
|
|
devlink_resource_occ_get_register(devlink,
|
|
NSIM_RESOURCE_IPV4_FIB,
|
|
nsim_fib_ipv4_resource_occ_get,
|
|
data);
|
|
devlink_resource_occ_get_register(devlink,
|
|
NSIM_RESOURCE_IPV4_FIB_RULES,
|
|
nsim_fib_ipv4_rules_res_occ_get,
|
|
data);
|
|
devlink_resource_occ_get_register(devlink,
|
|
NSIM_RESOURCE_IPV6_FIB,
|
|
nsim_fib_ipv6_resource_occ_get,
|
|
data);
|
|
devlink_resource_occ_get_register(devlink,
|
|
NSIM_RESOURCE_IPV6_FIB_RULES,
|
|
nsim_fib_ipv6_rules_res_occ_get,
|
|
data);
|
|
devlink_resource_occ_get_register(devlink,
|
|
NSIM_RESOURCE_NEXTHOPS,
|
|
nsim_fib_nexthops_res_occ_get,
|
|
data);
|
|
return data;
|
|
|
|
err_nexthop_nb_unregister:
|
|
unregister_nexthop_notifier(devlink_net(devlink), &data->nexthop_nb);
|
|
err_rhashtable_fib_destroy:
|
|
flush_work(&data->fib_event_work);
|
|
rhashtable_free_and_destroy(&data->fib_rt_ht, nsim_fib_rt_free,
|
|
data);
|
|
err_rhashtable_nexthop_destroy:
|
|
rhashtable_free_and_destroy(&data->nexthop_ht, nsim_nexthop_free,
|
|
data);
|
|
mutex_destroy(&data->fib_lock);
|
|
err_debugfs_exit:
|
|
mutex_destroy(&data->nh_lock);
|
|
nsim_fib_debugfs_exit(data);
|
|
err_data_free:
|
|
kfree(data);
|
|
return ERR_PTR(err);
|
|
}
|
|
|
|
void nsim_fib_destroy(struct devlink *devlink, struct nsim_fib_data *data)
|
|
{
|
|
devlink_resource_occ_get_unregister(devlink,
|
|
NSIM_RESOURCE_NEXTHOPS);
|
|
devlink_resource_occ_get_unregister(devlink,
|
|
NSIM_RESOURCE_IPV6_FIB_RULES);
|
|
devlink_resource_occ_get_unregister(devlink,
|
|
NSIM_RESOURCE_IPV6_FIB);
|
|
devlink_resource_occ_get_unregister(devlink,
|
|
NSIM_RESOURCE_IPV4_FIB_RULES);
|
|
devlink_resource_occ_get_unregister(devlink,
|
|
NSIM_RESOURCE_IPV4_FIB);
|
|
unregister_fib_notifier(devlink_net(devlink), &data->fib_nb);
|
|
unregister_nexthop_notifier(devlink_net(devlink), &data->nexthop_nb);
|
|
flush_work(&data->fib_event_work);
|
|
rhashtable_free_and_destroy(&data->fib_rt_ht, nsim_fib_rt_free,
|
|
data);
|
|
rhashtable_free_and_destroy(&data->nexthop_ht, nsim_nexthop_free,
|
|
data);
|
|
WARN_ON_ONCE(!list_empty(&data->fib_event_queue));
|
|
WARN_ON_ONCE(!list_empty(&data->fib_rt_list));
|
|
mutex_destroy(&data->fib_lock);
|
|
mutex_destroy(&data->nh_lock);
|
|
nsim_fib_debugfs_exit(data);
|
|
kfree(data);
|
|
}
|