Commit f66fd2dd authored by David S. Miller's avatar David S. Miller

Merge branch 'skb_hash'

Tom Herbert says:

====================
net: Add rxhash utility hash functions

v3:

There's really nothing specific about rxhash that constrains
it to be a value just for these receive path. Drop the 'rx'
part in utility functions, including skb_get_rxhash. In subsequent
patches, we can change the rxhash and l4_rxhash names also, as
well as abstracting out the interface to the hash.

Added comments about hash types per feedback.

In this version I'm omitting the changes to drivers to make the
patch set manageable. Will add those changes in followup pathes.

-----
This patch series introduce skb_set_rxhash and skb_clear_rxhash
which are called to set the rxhash (from network drivers) and
to clear the rxhash. This API should be used instead of updating
fields in the skbuff directly.
====================
Signed-off-by: default avatarDavid S. Miller <davem@davemloft.net>
parents 1aee6cc2 3df7a74e
...@@ -224,7 +224,7 @@ static struct macvtap_queue *macvtap_get_queue(struct net_device *dev, ...@@ -224,7 +224,7 @@ static struct macvtap_queue *macvtap_get_queue(struct net_device *dev,
goto out; goto out;
/* Check if we can use flow to select a queue */ /* Check if we can use flow to select a queue */
rxq = skb_get_rxhash(skb); rxq = skb_get_hash(skb);
if (rxq) { if (rxq) {
tap = rcu_dereference(vlan->taps[rxq % numvtaps]); tap = rcu_dereference(vlan->taps[rxq % numvtaps]);
goto out; goto out;
......
...@@ -358,7 +358,7 @@ static u16 tun_select_queue(struct net_device *dev, struct sk_buff *skb) ...@@ -358,7 +358,7 @@ static u16 tun_select_queue(struct net_device *dev, struct sk_buff *skb)
rcu_read_lock(); rcu_read_lock();
numqueues = ACCESS_ONCE(tun->numqueues); numqueues = ACCESS_ONCE(tun->numqueues);
txq = skb_get_rxhash(skb); txq = skb_get_hash(skb);
if (txq) { if (txq) {
e = tun_flow_find(&tun->flows[tun_hashfn(txq)], txq); e = tun_flow_find(&tun->flows[tun_hashfn(txq)], txq);
if (e) if (e)
...@@ -1146,7 +1146,7 @@ static ssize_t tun_get_user(struct tun_struct *tun, struct tun_file *tfile, ...@@ -1146,7 +1146,7 @@ static ssize_t tun_get_user(struct tun_struct *tun, struct tun_file *tfile,
skb_reset_network_header(skb); skb_reset_network_header(skb);
skb_probe_transport_header(skb, 0); skb_probe_transport_header(skb, 0);
rxhash = skb_get_rxhash(skb); rxhash = skb_get_hash(skb);
netif_rx_ni(skb); netif_rx_ni(skb);
tun->dev->stats.rx_packets++; tun->dev->stats.rx_packets++;
......
...@@ -1405,7 +1405,7 @@ __be16 vxlan_src_port(__u16 port_min, __u16 port_max, struct sk_buff *skb) ...@@ -1405,7 +1405,7 @@ __be16 vxlan_src_port(__u16 port_min, __u16 port_max, struct sk_buff *skb)
unsigned int range = (port_max - port_min) + 1; unsigned int range = (port_max - port_min) + 1;
u32 hash; u32 hash;
hash = skb_get_rxhash(skb); hash = skb_get_hash(skb);
if (!hash) if (!hash)
hash = jhash(skb->data, 2 * ETH_ALEN, hash = jhash(skb->data, 2 * ETH_ALEN,
(__force u32) skb->protocol); (__force u32) skb->protocol);
......
...@@ -703,15 +703,73 @@ unsigned int skb_find_text(struct sk_buff *skb, unsigned int from, ...@@ -703,15 +703,73 @@ unsigned int skb_find_text(struct sk_buff *skb, unsigned int from,
unsigned int to, struct ts_config *config, unsigned int to, struct ts_config *config,
struct ts_state *state); struct ts_state *state);
void __skb_get_rxhash(struct sk_buff *skb); /*
static inline __u32 skb_get_rxhash(struct sk_buff *skb) * Packet hash types specify the type of hash in skb_set_hash.
*
* Hash types refer to the protocol layer addresses which are used to
* construct a packet's hash. The hashes are used to differentiate or identify
* flows of the protocol layer for the hash type. Hash types are either
* layer-2 (L2), layer-3 (L3), or layer-4 (L4).
*
* Properties of hashes:
*
* 1) Two packets in different flows have different hash values
* 2) Two packets in the same flow should have the same hash value
*
* A hash at a higher layer is considered to be more specific. A driver should
* set the most specific hash possible.
*
* A driver cannot indicate a more specific hash than the layer at which a hash
* was computed. For instance an L3 hash cannot be set as an L4 hash.
*
* A driver may indicate a hash level which is less specific than the
* actual layer the hash was computed on. For instance, a hash computed
* at L4 may be considered an L3 hash. This should only be done if the
* driver can't unambiguously determine that the HW computed the hash at
* the higher layer. Note that the "should" in the second property above
* permits this.
*/
enum pkt_hash_types {
PKT_HASH_TYPE_NONE, /* Undefined type */
PKT_HASH_TYPE_L2, /* Input: src_MAC, dest_MAC */
PKT_HASH_TYPE_L3, /* Input: src_IP, dst_IP */
PKT_HASH_TYPE_L4, /* Input: src_IP, dst_IP, src_port, dst_port */
};
static inline void
skb_set_hash(struct sk_buff *skb, __u32 hash, enum pkt_hash_types type)
{
skb->l4_rxhash = (type == PKT_HASH_TYPE_L4);
skb->rxhash = hash;
}
void __skb_get_hash(struct sk_buff *skb);
static inline __u32 skb_get_hash(struct sk_buff *skb)
{ {
if (!skb->l4_rxhash) if (!skb->l4_rxhash)
__skb_get_rxhash(skb); __skb_get_hash(skb);
return skb->rxhash; return skb->rxhash;
} }
static inline void skb_clear_hash(struct sk_buff *skb)
{
skb->rxhash = 0;
skb->l4_rxhash = 0;
}
static inline void skb_clear_hash_if_not_l4(struct sk_buff *skb)
{
if (!skb->l4_rxhash)
skb_clear_hash(skb);
}
static inline void skb_copy_hash(struct sk_buff *to, const struct sk_buff *from)
{
to->rxhash = from->rxhash;
to->l4_rxhash = from->l4_rxhash;
};
#ifdef NET_SKBUFF_DATA_USES_OFFSET #ifdef NET_SKBUFF_DATA_USES_OFFSET
static inline unsigned char *skb_end_pointer(const struct sk_buff *skb) static inline unsigned char *skb_end_pointer(const struct sk_buff *skb)
{ {
......
...@@ -322,12 +322,11 @@ static inline void __skb_tunnel_rx(struct sk_buff *skb, struct net_device *dev, ...@@ -322,12 +322,11 @@ static inline void __skb_tunnel_rx(struct sk_buff *skb, struct net_device *dev,
skb->dev = dev; skb->dev = dev;
/* /*
* Clear rxhash so that we can recalulate the hash for the * Clear hash so that we can recalulate the hash for the
* encapsulated packet, unless we have already determine the hash * encapsulated packet, unless we have already determine the hash
* over the L4 4-tuple. * over the L4 4-tuple.
*/ */
if (!skb->l4_rxhash) skb_clear_hash_if_not_l4(skb);
skb->rxhash = 0;
skb_set_queue_mapping(skb, 0); skb_set_queue_mapping(skb, 0);
skb_scrub_packet(skb, !net_eq(net, dev_net(dev))); skb_scrub_packet(skb, !net_eq(net, dev_net(dev)));
} }
......
...@@ -3006,7 +3006,7 @@ static int get_rps_cpu(struct net_device *dev, struct sk_buff *skb, ...@@ -3006,7 +3006,7 @@ static int get_rps_cpu(struct net_device *dev, struct sk_buff *skb,
} }
skb_reset_network_header(skb); skb_reset_network_header(skb);
if (!skb_get_rxhash(skb)) if (!skb_get_hash(skb))
goto done; goto done;
flow_table = rcu_dereference(rxqueue->rps_flow_table); flow_table = rcu_dereference(rxqueue->rps_flow_table);
...@@ -3151,7 +3151,7 @@ static bool skb_flow_limit(struct sk_buff *skb, unsigned int qlen) ...@@ -3151,7 +3151,7 @@ static bool skb_flow_limit(struct sk_buff *skb, unsigned int qlen)
rcu_read_lock(); rcu_read_lock();
fl = rcu_dereference(sd->flow_limit); fl = rcu_dereference(sd->flow_limit);
if (fl) { if (fl) {
new_flow = skb_get_rxhash(skb) & (fl->num_buckets - 1); new_flow = skb_get_hash(skb) & (fl->num_buckets - 1);
old_flow = fl->history[fl->history_head]; old_flow = fl->history[fl->history_head];
fl->history[fl->history_head] = new_flow; fl->history[fl->history_head] = new_flow;
......
...@@ -202,12 +202,12 @@ static __always_inline u32 __flow_hash_1word(u32 a) ...@@ -202,12 +202,12 @@ static __always_inline u32 __flow_hash_1word(u32 a)
} }
/* /*
* __skb_get_rxhash: calculate a flow hash based on src/dst addresses * __skb_get_hash: calculate a flow hash based on src/dst addresses
* and src/dst port numbers. Sets rxhash in skb to non-zero hash value * and src/dst port numbers. Sets rxhash in skb to non-zero hash value
* on success, zero indicates no valid hash. Also, sets l4_rxhash in skb * on success, zero indicates no valid hash. Also, sets l4_rxhash in skb
* if hash is a canonical 4-tuple hash over transport ports. * if hash is a canonical 4-tuple hash over transport ports.
*/ */
void __skb_get_rxhash(struct sk_buff *skb) void __skb_get_hash(struct sk_buff *skb)
{ {
struct flow_keys keys; struct flow_keys keys;
u32 hash; u32 hash;
...@@ -234,7 +234,7 @@ void __skb_get_rxhash(struct sk_buff *skb) ...@@ -234,7 +234,7 @@ void __skb_get_rxhash(struct sk_buff *skb)
skb->rxhash = hash; skb->rxhash = hash;
} }
EXPORT_SYMBOL(__skb_get_rxhash); EXPORT_SYMBOL(__skb_get_hash);
/* /*
* Returns a Tx hash based on the given packet descriptor a Tx queues' number * Returns a Tx hash based on the given packet descriptor a Tx queues' number
......
...@@ -712,9 +712,8 @@ static void __copy_skb_header(struct sk_buff *new, const struct sk_buff *old) ...@@ -712,9 +712,8 @@ static void __copy_skb_header(struct sk_buff *new, const struct sk_buff *old)
new->inner_network_header = old->inner_network_header; new->inner_network_header = old->inner_network_header;
new->inner_mac_header = old->inner_mac_header; new->inner_mac_header = old->inner_mac_header;
skb_dst_copy(new, old); skb_dst_copy(new, old);
new->rxhash = old->rxhash; skb_copy_hash(new, old);
new->ooo_okay = old->ooo_okay; new->ooo_okay = old->ooo_okay;
new->l4_rxhash = old->l4_rxhash;
new->no_fcs = old->no_fcs; new->no_fcs = old->no_fcs;
new->encapsulation = old->encapsulation; new->encapsulation = old->encapsulation;
#ifdef CONFIG_XFRM #ifdef CONFIG_XFRM
......
...@@ -704,7 +704,7 @@ struct sk_buff *ip_check_defrag(struct sk_buff *skb, u32 user) ...@@ -704,7 +704,7 @@ struct sk_buff *ip_check_defrag(struct sk_buff *skb, u32 user)
memset(IPCB(skb), 0, sizeof(struct inet_skb_parm)); memset(IPCB(skb), 0, sizeof(struct inet_skb_parm));
if (ip_defrag(skb, user)) if (ip_defrag(skb, user))
return NULL; return NULL;
skb->rxhash = 0; skb_clear_hash(skb);
} }
} }
return skb; return skb;
......
...@@ -56,7 +56,7 @@ int iptunnel_xmit(struct rtable *rt, struct sk_buff *skb, ...@@ -56,7 +56,7 @@ int iptunnel_xmit(struct rtable *rt, struct sk_buff *skb,
skb_scrub_packet(skb, xnet); skb_scrub_packet(skb, xnet);
skb->rxhash = 0; skb_clear_hash(skb);
skb_dst_set(skb, &rt->dst); skb_dst_set(skb, &rt->dst);
memset(IPCB(skb), 0, sizeof(*IPCB(skb))); memset(IPCB(skb), 0, sizeof(*IPCB(skb)));
...@@ -107,8 +107,7 @@ int iptunnel_pull_header(struct sk_buff *skb, int hdr_len, __be16 inner_proto) ...@@ -107,8 +107,7 @@ int iptunnel_pull_header(struct sk_buff *skb, int hdr_len, __be16 inner_proto)
nf_reset(skb); nf_reset(skb);
secpath_reset(skb); secpath_reset(skb);
if (!skb->l4_rxhash) skb_clear_hash_if_not_l4(skb);
skb->rxhash = 0;
skb_dst_drop(skb); skb_dst_drop(skb);
skb->vlan_tci = 0; skb->vlan_tci = 0;
skb_set_queue_mapping(skb, 0); skb_set_queue_mapping(skb, 0);
......
...@@ -165,7 +165,7 @@ static void set_ip_addr(struct sk_buff *skb, struct iphdr *nh, ...@@ -165,7 +165,7 @@ static void set_ip_addr(struct sk_buff *skb, struct iphdr *nh,
} }
csum_replace4(&nh->check, *addr, new_addr); csum_replace4(&nh->check, *addr, new_addr);
skb->rxhash = 0; skb_clear_hash(skb);
*addr = new_addr; *addr = new_addr;
} }
...@@ -199,7 +199,7 @@ static void set_ipv6_addr(struct sk_buff *skb, u8 l4_proto, ...@@ -199,7 +199,7 @@ static void set_ipv6_addr(struct sk_buff *skb, u8 l4_proto,
if (recalculate_csum) if (recalculate_csum)
update_ipv6_checksum(skb, l4_proto, addr, new_addr); update_ipv6_checksum(skb, l4_proto, addr, new_addr);
skb->rxhash = 0; skb_clear_hash(skb);
memcpy(addr, new_addr, sizeof(__be32[4])); memcpy(addr, new_addr, sizeof(__be32[4]));
} }
...@@ -296,7 +296,7 @@ static void set_tp_port(struct sk_buff *skb, __be16 *port, ...@@ -296,7 +296,7 @@ static void set_tp_port(struct sk_buff *skb, __be16 *port,
{ {
inet_proto_csum_replace2(check, skb, *port, new_port, 0); inet_proto_csum_replace2(check, skb, *port, new_port, 0);
*port = new_port; *port = new_port;
skb->rxhash = 0; skb_clear_hash(skb);
} }
static void set_udp_port(struct sk_buff *skb, __be16 *port, __be16 new_port) static void set_udp_port(struct sk_buff *skb, __be16 *port, __be16 new_port)
...@@ -310,7 +310,7 @@ static void set_udp_port(struct sk_buff *skb, __be16 *port, __be16 new_port) ...@@ -310,7 +310,7 @@ static void set_udp_port(struct sk_buff *skb, __be16 *port, __be16 new_port)
uh->check = CSUM_MANGLED_0; uh->check = CSUM_MANGLED_0;
} else { } else {
*port = new_port; *port = new_port;
skb->rxhash = 0; skb_clear_hash(skb);
} }
} }
...@@ -381,7 +381,7 @@ static int set_sctp(struct sk_buff *skb, ...@@ -381,7 +381,7 @@ static int set_sctp(struct sk_buff *skb,
/* Carry any checksum errors through. */ /* Carry any checksum errors through. */
sh->checksum = old_csum ^ old_correct_csum ^ new_csum; sh->checksum = old_csum ^ old_correct_csum ^ new_csum;
skb->rxhash = 0; skb_clear_hash(skb);
} }
return 0; return 0;
......
...@@ -963,7 +963,7 @@ static void prb_clear_blk_fill_status(struct packet_ring_buffer *rb) ...@@ -963,7 +963,7 @@ static void prb_clear_blk_fill_status(struct packet_ring_buffer *rb)
static void prb_fill_rxhash(struct tpacket_kbdq_core *pkc, static void prb_fill_rxhash(struct tpacket_kbdq_core *pkc,
struct tpacket3_hdr *ppd) struct tpacket3_hdr *ppd)
{ {
ppd->hv1.tp_rxhash = skb_get_rxhash(pkc->skb); ppd->hv1.tp_rxhash = skb_get_hash(pkc->skb);
} }
static void prb_clear_rxhash(struct tpacket_kbdq_core *pkc, static void prb_clear_rxhash(struct tpacket_kbdq_core *pkc,
...@@ -1295,7 +1295,7 @@ static int packet_rcv_fanout(struct sk_buff *skb, struct net_device *dev, ...@@ -1295,7 +1295,7 @@ static int packet_rcv_fanout(struct sk_buff *skb, struct net_device *dev,
if (!skb) if (!skb)
return 0; return 0;
} }
skb_get_rxhash(skb); skb_get_hash(skb);
idx = fanout_demux_hash(f, skb, num); idx = fanout_demux_hash(f, skb, num);
break; break;
case PACKET_FANOUT_LB: case PACKET_FANOUT_LB:
......
...@@ -220,7 +220,7 @@ static u32 flow_get_vlan_tag(const struct sk_buff *skb) ...@@ -220,7 +220,7 @@ static u32 flow_get_vlan_tag(const struct sk_buff *skb)
static u32 flow_get_rxhash(struct sk_buff *skb) static u32 flow_get_rxhash(struct sk_buff *skb)
{ {
return skb_get_rxhash(skb); return skb_get_hash(skb);
} }
static u32 flow_key_get(struct sk_buff *skb, int key, struct flow_keys *flow) static u32 flow_key_get(struct sk_buff *skb, int key, struct flow_keys *flow)
......
...@@ -222,7 +222,7 @@ META_COLLECTOR(int_maclen) ...@@ -222,7 +222,7 @@ META_COLLECTOR(int_maclen)
META_COLLECTOR(int_rxhash) META_COLLECTOR(int_rxhash)
{ {
dst->value = skb_get_rxhash(skb); dst->value = skb_get_hash(skb);
} }
/************************************************************************** /**************************************************************************
......
...@@ -226,7 +226,7 @@ static struct fq_flow *fq_classify(struct sk_buff *skb, struct fq_sched_data *q) ...@@ -226,7 +226,7 @@ static struct fq_flow *fq_classify(struct sk_buff *skb, struct fq_sched_data *q)
/* By forcing low order bit to 1, we make sure to not /* By forcing low order bit to 1, we make sure to not
* collide with a local flow (socket pointers are word aligned) * collide with a local flow (socket pointers are word aligned)
*/ */
sk = (struct sock *)(skb_get_rxhash(skb) | 1L); sk = (struct sock *)(skb_get_hash(skb) | 1L);
} }
root = &q->fq_root[hash_32((u32)(long)sk, q->fq_trees_log)]; root = &q->fq_root[hash_32((u32)(long)sk, q->fq_trees_log)];
......
Markdown is supported
0%
or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment