Commit 15f926c4 authored by Eric Dumazet, committed by David S. Miller

ipv6: lockless IPV6_MTU implementation

np->frag_size can be read/written without holding socket lock.

Add missing annotations and make IPV6_MTU setsockopt() lockless.

Signed-off-by: Eric Dumazet <edumazet@google.com>
Reviewed-by: David Ahern <dsahern@kernel.org>
Signed-off-by: David S. Miller <davem@davemloft.net>
parent 2da23eb0
...@@ -881,9 +881,11 @@ int ip6_fragment(struct net *net, struct sock *sk, struct sk_buff *skb, ...@@ -881,9 +881,11 @@ int ip6_fragment(struct net *net, struct sock *sk, struct sk_buff *skb,
mtu = IPV6_MIN_MTU; mtu = IPV6_MIN_MTU;
} }
if (np && np->frag_size < mtu) { if (np) {
if (np->frag_size) u32 frag_size = READ_ONCE(np->frag_size);
mtu = np->frag_size;
if (frag_size && frag_size < mtu)
mtu = frag_size;
} }
if (mtu < hlen + sizeof(struct frag_hdr) + 8) if (mtu < hlen + sizeof(struct frag_hdr) + 8)
goto fail_toobig; goto fail_toobig;
...@@ -1392,7 +1394,7 @@ static int ip6_setup_cork(struct sock *sk, struct inet_cork_full *cork, ...@@ -1392,7 +1394,7 @@ static int ip6_setup_cork(struct sock *sk, struct inet_cork_full *cork,
struct rt6_info *rt) struct rt6_info *rt)
{ {
struct ipv6_pinfo *np = inet6_sk(sk); struct ipv6_pinfo *np = inet6_sk(sk);
unsigned int mtu; unsigned int mtu, frag_size;
struct ipv6_txoptions *nopt, *opt = ipc6->opt; struct ipv6_txoptions *nopt, *opt = ipc6->opt;
/* callers pass dst together with a reference, set it first so /* callers pass dst together with a reference, set it first so
...@@ -1441,10 +1443,11 @@ static int ip6_setup_cork(struct sock *sk, struct inet_cork_full *cork, ...@@ -1441,10 +1443,11 @@ static int ip6_setup_cork(struct sock *sk, struct inet_cork_full *cork,
else else
mtu = np->pmtudisc >= IPV6_PMTUDISC_PROBE ? mtu = np->pmtudisc >= IPV6_PMTUDISC_PROBE ?
READ_ONCE(rt->dst.dev->mtu) : dst_mtu(xfrm_dst_path(&rt->dst)); READ_ONCE(rt->dst.dev->mtu) : dst_mtu(xfrm_dst_path(&rt->dst));
if (np->frag_size < mtu) {
if (np->frag_size) frag_size = READ_ONCE(np->frag_size);
mtu = np->frag_size; if (frag_size && frag_size < mtu)
} mtu = frag_size;
cork->base.fragsize = mtu; cork->base.fragsize = mtu;
cork->base.gso_size = ipc6->gso_size; cork->base.gso_size = ipc6->gso_size;
cork->base.tx_flags = 0; cork->base.tx_flags = 0;
......
...@@ -441,6 +441,13 @@ int do_ipv6_setsockopt(struct sock *sk, int level, int optname, ...@@ -441,6 +441,13 @@ int do_ipv6_setsockopt(struct sock *sk, int level, int optname,
WRITE_ONCE(np->mcast_hops, WRITE_ONCE(np->mcast_hops,
val == -1 ? IPV6_DEFAULT_MCASTHOPS : val); val == -1 ? IPV6_DEFAULT_MCASTHOPS : val);
return 0; return 0;
case IPV6_MTU:
if (optlen < sizeof(int))
return -EINVAL;
if (val && val < IPV6_MIN_MTU)
return -EINVAL;
WRITE_ONCE(np->frag_size, val);
return 0;
} }
if (needs_rtnl) if (needs_rtnl)
rtnl_lock(); rtnl_lock();
...@@ -910,14 +917,6 @@ int do_ipv6_setsockopt(struct sock *sk, int level, int optname, ...@@ -910,14 +917,6 @@ int do_ipv6_setsockopt(struct sock *sk, int level, int optname,
np->pmtudisc = val; np->pmtudisc = val;
retv = 0; retv = 0;
break; break;
case IPV6_MTU:
if (optlen < sizeof(int))
goto e_inval;
if (val && val < IPV6_MIN_MTU)
goto e_inval;
np->frag_size = val;
retv = 0;
break;
case IPV6_RECVERR: case IPV6_RECVERR:
if (optlen < sizeof(int)) if (optlen < sizeof(int))
goto e_inval; goto e_inval;
......
Markdown is supported
0%
or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment