Commit 5aad1de5 authored by Timo Teräs, committed by David S. Miller

ipv4: use separate genid for next hop exceptions

commit 13d82bf5 (ipv4: Fix flushing of cached routing informations)
added support for flushing learned pmtu information.

However, using rt_genid for this is quite heavy, as it is bumped on
route add/change and multicast events, among other places. These can
happen quite often, especially when using dynamic routing protocols.

While this is ok for routes (as they are just recreated locally),
the pmtu information is learned from remote systems and the icmp
notification can come with long delays. It is worthwhile to have a
separate genid to avoid excessive pmtu resets.

Cc: Steffen Klassert <steffen.klassert@secunet.com>
Signed-off-by: Timo Teräs <timo.teras@iki.fi>
Signed-off-by: David S. Miller <davem@davemloft.net>
parent f016229e
...@@ -51,6 +51,7 @@ struct rtable; ...@@ -51,6 +51,7 @@ struct rtable;
struct fib_nh_exception { struct fib_nh_exception {
struct fib_nh_exception __rcu *fnhe_next; struct fib_nh_exception __rcu *fnhe_next;
int fnhe_genid;
__be32 fnhe_daddr; __be32 fnhe_daddr;
u32 fnhe_pmtu; u32 fnhe_pmtu;
__be32 fnhe_gw; __be32 fnhe_gw;
......
...@@ -118,6 +118,7 @@ struct net { ...@@ -118,6 +118,7 @@ struct net {
struct netns_ipvs *ipvs; struct netns_ipvs *ipvs;
struct sock *diag_nlsk; struct sock *diag_nlsk;
atomic_t rt_genid; atomic_t rt_genid;
atomic_t fnhe_genid;
}; };
/* /*
...@@ -340,4 +341,14 @@ static inline void rt_genid_bump(struct net *net) ...@@ -340,4 +341,14 @@ static inline void rt_genid_bump(struct net *net)
atomic_inc(&net->rt_genid); atomic_inc(&net->rt_genid);
} }
/*
 * fnhe_genid - read the namespace's next hop exception generation id.
 * @net: network namespace whose counter is read
 *
 * Returns the current value of net->fnhe_genid, obtained with
 * atomic_read().  Callers compare it against the genid stored in a
 * next hop exception entry to detect that the entry predates a flush.
 */
static inline int fnhe_genid(struct net *net)
{
	const int current_genid = atomic_read(&net->fnhe_genid);

	return current_genid;
}
static inline void fnhe_genid_bump(struct net *net)
{
atomic_inc(&net->fnhe_genid);
}
#endif /* __NET_NET_NAMESPACE_H */ #endif /* __NET_NET_NAMESPACE_H */
...@@ -658,6 +658,7 @@ static void update_or_create_fnhe(struct fib_nh *nh, __be32 daddr, __be32 gw, ...@@ -658,6 +658,7 @@ static void update_or_create_fnhe(struct fib_nh *nh, __be32 daddr, __be32 gw,
fnhe->fnhe_next = hash->chain; fnhe->fnhe_next = hash->chain;
rcu_assign_pointer(hash->chain, fnhe); rcu_assign_pointer(hash->chain, fnhe);
} }
fnhe->fnhe_genid = fnhe_genid(dev_net(nh->nh_dev));
fnhe->fnhe_daddr = daddr; fnhe->fnhe_daddr = daddr;
fnhe->fnhe_gw = gw; fnhe->fnhe_gw = gw;
fnhe->fnhe_pmtu = pmtu; fnhe->fnhe_pmtu = pmtu;
...@@ -1236,8 +1237,11 @@ static bool rt_bind_exception(struct rtable *rt, struct fib_nh_exception *fnhe, ...@@ -1236,8 +1237,11 @@ static bool rt_bind_exception(struct rtable *rt, struct fib_nh_exception *fnhe,
spin_lock_bh(&fnhe_lock); spin_lock_bh(&fnhe_lock);
if (daddr == fnhe->fnhe_daddr) { if (daddr == fnhe->fnhe_daddr) {
int genid = fnhe_genid(dev_net(rt->dst.dev));
struct rtable *orig = rcu_dereference(fnhe->fnhe_rth); struct rtable *orig = rcu_dereference(fnhe->fnhe_rth);
if (orig && rt_is_expired(orig)) {
if (fnhe->fnhe_genid != genid) {
fnhe->fnhe_genid = genid;
fnhe->fnhe_gw = 0; fnhe->fnhe_gw = 0;
fnhe->fnhe_pmtu = 0; fnhe->fnhe_pmtu = 0;
fnhe->fnhe_expires = 0; fnhe->fnhe_expires = 0;
...@@ -2443,8 +2447,11 @@ static int ipv4_sysctl_rtcache_flush(ctl_table *__ctl, int write, ...@@ -2443,8 +2447,11 @@ static int ipv4_sysctl_rtcache_flush(ctl_table *__ctl, int write,
void __user *buffer, void __user *buffer,
size_t *lenp, loff_t *ppos) size_t *lenp, loff_t *ppos)
{ {
struct net *net = (struct net *)__ctl->extra1;
if (write) { if (write) {
rt_cache_flush((struct net *)__ctl->extra1); rt_cache_flush(net);
fnhe_genid_bump(net);
return 0; return 0;
} }
...@@ -2619,6 +2626,7 @@ static __net_initdata struct pernet_operations sysctl_route_ops = { ...@@ -2619,6 +2626,7 @@ static __net_initdata struct pernet_operations sysctl_route_ops = {
static __net_init int rt_genid_init(struct net *net) static __net_init int rt_genid_init(struct net *net)
{ {
atomic_set(&net->rt_genid, 0); atomic_set(&net->rt_genid, 0);
atomic_set(&net->fnhe_genid, 0);
get_random_bytes(&net->ipv4.dev_addr_genid, get_random_bytes(&net->ipv4.dev_addr_genid,
sizeof(net->ipv4.dev_addr_genid)); sizeof(net->ipv4.dev_addr_genid));
return 0; return 0;
......
Markdown is supported
0%
or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment