powerpc/powernv: Report size of OPAL memcons log
[linux/fpc-iii.git] / net / core / flow_dissector.c
blob1b7673aac59d51a5f8b5ef3f2076f1440c017fae
1 #include <linux/kernel.h>
2 #include <linux/skbuff.h>
3 #include <linux/export.h>
4 #include <linux/ip.h>
5 #include <linux/ipv6.h>
6 #include <linux/if_vlan.h>
7 #include <net/ip.h>
8 #include <net/ipv6.h>
9 #include <net/gre.h>
10 #include <net/pptp.h>
11 #include <linux/igmp.h>
12 #include <linux/icmp.h>
13 #include <linux/sctp.h>
14 #include <linux/dccp.h>
15 #include <linux/if_tunnel.h>
16 #include <linux/if_pppox.h>
17 #include <linux/ppp_defs.h>
18 #include <linux/stddef.h>
19 #include <linux/if_ether.h>
20 #include <linux/mpls.h>
21 #include <net/flow_dissector.h>
22 #include <scsi/fc/fc_fcoe.h>
24 static void dissector_set_key(struct flow_dissector *flow_dissector,
25 enum flow_dissector_key_id key_id)
27 flow_dissector->used_keys |= (1 << key_id);
30 void skb_flow_dissector_init(struct flow_dissector *flow_dissector,
31 const struct flow_dissector_key *key,
32 unsigned int key_count)
34 unsigned int i;
36 memset(flow_dissector, 0, sizeof(*flow_dissector));
38 for (i = 0; i < key_count; i++, key++) {
39 /* User should make sure that every key target offset is withing
40 * boundaries of unsigned short.
42 BUG_ON(key->offset > USHRT_MAX);
43 BUG_ON(dissector_uses_key(flow_dissector,
44 key->key_id));
46 dissector_set_key(flow_dissector, key->key_id);
47 flow_dissector->offset[key->key_id] = key->offset;
50 /* Ensure that the dissector always includes control and basic key.
51 * That way we are able to avoid handling lack of these in fast path.
53 BUG_ON(!dissector_uses_key(flow_dissector,
54 FLOW_DISSECTOR_KEY_CONTROL));
55 BUG_ON(!dissector_uses_key(flow_dissector,
56 FLOW_DISSECTOR_KEY_BASIC));
58 EXPORT_SYMBOL(skb_flow_dissector_init);
60 /**
61 * skb_flow_get_be16 - extract be16 entity
62 * @skb: sk_buff to extract from
63 * @poff: offset to extract at
64 * @data: raw buffer pointer to the packet
65 * @hlen: packet header length
67 * The function will try to retrieve a be32 entity at
68 * offset poff
70 static __be16 skb_flow_get_be16(const struct sk_buff *skb, int poff,
71 void *data, int hlen)
73 __be16 *u, _u;
75 u = __skb_header_pointer(skb, poff, sizeof(_u), data, hlen, &_u);
76 if (u)
77 return *u;
79 return 0;
82 /**
83 * __skb_flow_get_ports - extract the upper layer ports and return them
84 * @skb: sk_buff to extract the ports from
85 * @thoff: transport header offset
86 * @ip_proto: protocol for which to get port offset
87 * @data: raw buffer pointer to the packet, if NULL use skb->data
88 * @hlen: packet header length, if @data is NULL use skb_headlen(skb)
90 * The function will try to retrieve the ports at offset thoff + poff where poff
91 * is the protocol port offset returned from proto_ports_offset
93 __be32 __skb_flow_get_ports(const struct sk_buff *skb, int thoff, u8 ip_proto,
94 void *data, int hlen)
96 int poff = proto_ports_offset(ip_proto);
98 if (!data) {
99 data = skb->data;
100 hlen = skb_headlen(skb);
103 if (poff >= 0) {
104 __be32 *ports, _ports;
106 ports = __skb_header_pointer(skb, thoff + poff,
107 sizeof(_ports), data, hlen, &_ports);
108 if (ports)
109 return *ports;
112 return 0;
114 EXPORT_SYMBOL(__skb_flow_get_ports);
117 * __skb_flow_dissect - extract the flow_keys struct and return it
118 * @skb: sk_buff to extract the flow from, can be NULL if the rest are specified
119 * @flow_dissector: list of keys to dissect
120 * @target_container: target structure to put dissected values into
121 * @data: raw buffer pointer to the packet, if NULL use skb->data
122 * @proto: protocol for which to get the flow, if @data is NULL use skb->protocol
123 * @nhoff: network header offset, if @data is NULL use skb_network_offset(skb)
124 * @hlen: packet header length, if @data is NULL use skb_headlen(skb)
126 * The function will try to retrieve individual keys into target specified
127 * by flow_dissector from either the skbuff or a raw buffer specified by the
128 * rest parameters.
130 * Caller must take care of zeroing target container memory.
132 bool __skb_flow_dissect(const struct sk_buff *skb,
133 struct flow_dissector *flow_dissector,
134 void *target_container,
135 void *data, __be16 proto, int nhoff, int hlen,
136 unsigned int flags)
138 struct flow_dissector_key_control *key_control;
139 struct flow_dissector_key_basic *key_basic;
140 struct flow_dissector_key_addrs *key_addrs;
141 struct flow_dissector_key_ports *key_ports;
142 struct flow_dissector_key_icmp *key_icmp;
143 struct flow_dissector_key_tags *key_tags;
144 struct flow_dissector_key_vlan *key_vlan;
145 struct flow_dissector_key_keyid *key_keyid;
146 bool skip_vlan = false;
147 u8 ip_proto = 0;
148 bool ret;
150 if (!data) {
151 data = skb->data;
152 proto = skb_vlan_tag_present(skb) ?
153 skb->vlan_proto : skb->protocol;
154 nhoff = skb_network_offset(skb);
155 hlen = skb_headlen(skb);
158 /* It is ensured by skb_flow_dissector_init() that control key will
159 * be always present.
161 key_control = skb_flow_dissector_target(flow_dissector,
162 FLOW_DISSECTOR_KEY_CONTROL,
163 target_container);
165 /* It is ensured by skb_flow_dissector_init() that basic key will
166 * be always present.
168 key_basic = skb_flow_dissector_target(flow_dissector,
169 FLOW_DISSECTOR_KEY_BASIC,
170 target_container);
172 if (dissector_uses_key(flow_dissector,
173 FLOW_DISSECTOR_KEY_ETH_ADDRS)) {
174 struct ethhdr *eth = eth_hdr(skb);
175 struct flow_dissector_key_eth_addrs *key_eth_addrs;
177 key_eth_addrs = skb_flow_dissector_target(flow_dissector,
178 FLOW_DISSECTOR_KEY_ETH_ADDRS,
179 target_container);
180 memcpy(key_eth_addrs, &eth->h_dest, sizeof(*key_eth_addrs));
183 again:
184 switch (proto) {
185 case htons(ETH_P_IP): {
186 const struct iphdr *iph;
187 struct iphdr _iph;
189 iph = __skb_header_pointer(skb, nhoff, sizeof(_iph), data, hlen, &_iph);
190 if (!iph || iph->ihl < 5)
191 goto out_bad;
192 nhoff += iph->ihl * 4;
194 ip_proto = iph->protocol;
196 if (dissector_uses_key(flow_dissector,
197 FLOW_DISSECTOR_KEY_IPV4_ADDRS)) {
198 key_addrs = skb_flow_dissector_target(flow_dissector,
199 FLOW_DISSECTOR_KEY_IPV4_ADDRS,
200 target_container);
202 memcpy(&key_addrs->v4addrs, &iph->saddr,
203 sizeof(key_addrs->v4addrs));
204 key_control->addr_type = FLOW_DISSECTOR_KEY_IPV4_ADDRS;
207 if (ip_is_fragment(iph)) {
208 key_control->flags |= FLOW_DIS_IS_FRAGMENT;
210 if (iph->frag_off & htons(IP_OFFSET)) {
211 goto out_good;
212 } else {
213 key_control->flags |= FLOW_DIS_FIRST_FRAG;
214 if (!(flags & FLOW_DISSECTOR_F_PARSE_1ST_FRAG))
215 goto out_good;
219 if (flags & FLOW_DISSECTOR_F_STOP_AT_L3)
220 goto out_good;
222 break;
224 case htons(ETH_P_IPV6): {
225 const struct ipv6hdr *iph;
226 struct ipv6hdr _iph;
228 ipv6:
229 iph = __skb_header_pointer(skb, nhoff, sizeof(_iph), data, hlen, &_iph);
230 if (!iph)
231 goto out_bad;
233 ip_proto = iph->nexthdr;
234 nhoff += sizeof(struct ipv6hdr);
236 if (dissector_uses_key(flow_dissector,
237 FLOW_DISSECTOR_KEY_IPV6_ADDRS)) {
238 key_addrs = skb_flow_dissector_target(flow_dissector,
239 FLOW_DISSECTOR_KEY_IPV6_ADDRS,
240 target_container);
242 memcpy(&key_addrs->v6addrs, &iph->saddr,
243 sizeof(key_addrs->v6addrs));
244 key_control->addr_type = FLOW_DISSECTOR_KEY_IPV6_ADDRS;
247 if ((dissector_uses_key(flow_dissector,
248 FLOW_DISSECTOR_KEY_FLOW_LABEL) ||
249 (flags & FLOW_DISSECTOR_F_STOP_AT_FLOW_LABEL)) &&
250 ip6_flowlabel(iph)) {
251 __be32 flow_label = ip6_flowlabel(iph);
253 if (dissector_uses_key(flow_dissector,
254 FLOW_DISSECTOR_KEY_FLOW_LABEL)) {
255 key_tags = skb_flow_dissector_target(flow_dissector,
256 FLOW_DISSECTOR_KEY_FLOW_LABEL,
257 target_container);
258 key_tags->flow_label = ntohl(flow_label);
260 if (flags & FLOW_DISSECTOR_F_STOP_AT_FLOW_LABEL)
261 goto out_good;
264 if (flags & FLOW_DISSECTOR_F_STOP_AT_L3)
265 goto out_good;
267 break;
269 case htons(ETH_P_8021AD):
270 case htons(ETH_P_8021Q): {
271 const struct vlan_hdr *vlan;
272 struct vlan_hdr _vlan;
273 bool vlan_tag_present = skb && skb_vlan_tag_present(skb);
275 if (vlan_tag_present)
276 proto = skb->protocol;
278 if (!vlan_tag_present || eth_type_vlan(skb->protocol)) {
279 vlan = __skb_header_pointer(skb, nhoff, sizeof(_vlan),
280 data, hlen, &_vlan);
281 if (!vlan)
282 goto out_bad;
283 proto = vlan->h_vlan_encapsulated_proto;
284 nhoff += sizeof(*vlan);
285 if (skip_vlan)
286 goto again;
289 skip_vlan = true;
290 if (dissector_uses_key(flow_dissector,
291 FLOW_DISSECTOR_KEY_VLAN)) {
292 key_vlan = skb_flow_dissector_target(flow_dissector,
293 FLOW_DISSECTOR_KEY_VLAN,
294 target_container);
296 if (vlan_tag_present) {
297 key_vlan->vlan_id = skb_vlan_tag_get_id(skb);
298 key_vlan->vlan_priority =
299 (skb_vlan_tag_get_prio(skb) >> VLAN_PRIO_SHIFT);
300 } else {
301 key_vlan->vlan_id = ntohs(vlan->h_vlan_TCI) &
302 VLAN_VID_MASK;
303 key_vlan->vlan_priority =
304 (ntohs(vlan->h_vlan_TCI) &
305 VLAN_PRIO_MASK) >> VLAN_PRIO_SHIFT;
309 goto again;
311 case htons(ETH_P_PPP_SES): {
312 struct {
313 struct pppoe_hdr hdr;
314 __be16 proto;
315 } *hdr, _hdr;
316 hdr = __skb_header_pointer(skb, nhoff, sizeof(_hdr), data, hlen, &_hdr);
317 if (!hdr)
318 goto out_bad;
319 proto = hdr->proto;
320 nhoff += PPPOE_SES_HLEN;
321 switch (proto) {
322 case htons(PPP_IP):
323 goto ip;
324 case htons(PPP_IPV6):
325 goto ipv6;
326 default:
327 goto out_bad;
330 case htons(ETH_P_TIPC): {
331 struct {
332 __be32 pre[3];
333 __be32 srcnode;
334 } *hdr, _hdr;
335 hdr = __skb_header_pointer(skb, nhoff, sizeof(_hdr), data, hlen, &_hdr);
336 if (!hdr)
337 goto out_bad;
339 if (dissector_uses_key(flow_dissector,
340 FLOW_DISSECTOR_KEY_TIPC_ADDRS)) {
341 key_addrs = skb_flow_dissector_target(flow_dissector,
342 FLOW_DISSECTOR_KEY_TIPC_ADDRS,
343 target_container);
344 key_addrs->tipcaddrs.srcnode = hdr->srcnode;
345 key_control->addr_type = FLOW_DISSECTOR_KEY_TIPC_ADDRS;
347 goto out_good;
350 case htons(ETH_P_MPLS_UC):
351 case htons(ETH_P_MPLS_MC): {
352 struct mpls_label *hdr, _hdr[2];
353 mpls:
354 hdr = __skb_header_pointer(skb, nhoff, sizeof(_hdr), data,
355 hlen, &_hdr);
356 if (!hdr)
357 goto out_bad;
359 if ((ntohl(hdr[0].entry) & MPLS_LS_LABEL_MASK) >>
360 MPLS_LS_LABEL_SHIFT == MPLS_LABEL_ENTROPY) {
361 if (dissector_uses_key(flow_dissector,
362 FLOW_DISSECTOR_KEY_MPLS_ENTROPY)) {
363 key_keyid = skb_flow_dissector_target(flow_dissector,
364 FLOW_DISSECTOR_KEY_MPLS_ENTROPY,
365 target_container);
366 key_keyid->keyid = hdr[1].entry &
367 htonl(MPLS_LS_LABEL_MASK);
370 goto out_good;
373 goto out_good;
376 case htons(ETH_P_FCOE):
377 if ((hlen - nhoff) < FCOE_HEADER_LEN)
378 goto out_bad;
380 nhoff += FCOE_HEADER_LEN;
381 goto out_good;
382 default:
383 goto out_bad;
386 ip_proto_again:
387 switch (ip_proto) {
388 case IPPROTO_GRE: {
389 struct gre_base_hdr *hdr, _hdr;
390 u16 gre_ver;
391 int offset = 0;
393 hdr = __skb_header_pointer(skb, nhoff, sizeof(_hdr), data, hlen, &_hdr);
394 if (!hdr)
395 goto out_bad;
397 /* Only look inside GRE without routing */
398 if (hdr->flags & GRE_ROUTING)
399 break;
401 /* Only look inside GRE for version 0 and 1 */
402 gre_ver = ntohs(hdr->flags & GRE_VERSION);
403 if (gre_ver > 1)
404 break;
406 proto = hdr->protocol;
407 if (gre_ver) {
408 /* Version1 must be PPTP, and check the flags */
409 if (!(proto == GRE_PROTO_PPP && (hdr->flags & GRE_KEY)))
410 break;
413 offset += sizeof(struct gre_base_hdr);
415 if (hdr->flags & GRE_CSUM)
416 offset += sizeof(((struct gre_full_hdr *)0)->csum) +
417 sizeof(((struct gre_full_hdr *)0)->reserved1);
419 if (hdr->flags & GRE_KEY) {
420 const __be32 *keyid;
421 __be32 _keyid;
423 keyid = __skb_header_pointer(skb, nhoff + offset, sizeof(_keyid),
424 data, hlen, &_keyid);
425 if (!keyid)
426 goto out_bad;
428 if (dissector_uses_key(flow_dissector,
429 FLOW_DISSECTOR_KEY_GRE_KEYID)) {
430 key_keyid = skb_flow_dissector_target(flow_dissector,
431 FLOW_DISSECTOR_KEY_GRE_KEYID,
432 target_container);
433 if (gre_ver == 0)
434 key_keyid->keyid = *keyid;
435 else
436 key_keyid->keyid = *keyid & GRE_PPTP_KEY_MASK;
438 offset += sizeof(((struct gre_full_hdr *)0)->key);
441 if (hdr->flags & GRE_SEQ)
442 offset += sizeof(((struct pptp_gre_header *)0)->seq);
444 if (gre_ver == 0) {
445 if (proto == htons(ETH_P_TEB)) {
446 const struct ethhdr *eth;
447 struct ethhdr _eth;
449 eth = __skb_header_pointer(skb, nhoff + offset,
450 sizeof(_eth),
451 data, hlen, &_eth);
452 if (!eth)
453 goto out_bad;
454 proto = eth->h_proto;
455 offset += sizeof(*eth);
457 /* Cap headers that we access via pointers at the
458 * end of the Ethernet header as our maximum alignment
459 * at that point is only 2 bytes.
461 if (NET_IP_ALIGN)
462 hlen = (nhoff + offset);
464 } else { /* version 1, must be PPTP */
465 u8 _ppp_hdr[PPP_HDRLEN];
466 u8 *ppp_hdr;
468 if (hdr->flags & GRE_ACK)
469 offset += sizeof(((struct pptp_gre_header *)0)->ack);
471 ppp_hdr = __skb_header_pointer(skb, nhoff + offset,
472 sizeof(_ppp_hdr),
473 data, hlen, _ppp_hdr);
474 if (!ppp_hdr)
475 goto out_bad;
477 switch (PPP_PROTOCOL(ppp_hdr)) {
478 case PPP_IP:
479 proto = htons(ETH_P_IP);
480 break;
481 case PPP_IPV6:
482 proto = htons(ETH_P_IPV6);
483 break;
484 default:
485 /* Could probably catch some more like MPLS */
486 break;
489 offset += PPP_HDRLEN;
492 nhoff += offset;
493 key_control->flags |= FLOW_DIS_ENCAPSULATION;
494 if (flags & FLOW_DISSECTOR_F_STOP_AT_ENCAP)
495 goto out_good;
497 goto again;
499 case NEXTHDR_HOP:
500 case NEXTHDR_ROUTING:
501 case NEXTHDR_DEST: {
502 u8 _opthdr[2], *opthdr;
504 if (proto != htons(ETH_P_IPV6))
505 break;
507 opthdr = __skb_header_pointer(skb, nhoff, sizeof(_opthdr),
508 data, hlen, &_opthdr);
509 if (!opthdr)
510 goto out_bad;
512 ip_proto = opthdr[0];
513 nhoff += (opthdr[1] + 1) << 3;
515 goto ip_proto_again;
517 case NEXTHDR_FRAGMENT: {
518 struct frag_hdr _fh, *fh;
520 if (proto != htons(ETH_P_IPV6))
521 break;
523 fh = __skb_header_pointer(skb, nhoff, sizeof(_fh),
524 data, hlen, &_fh);
526 if (!fh)
527 goto out_bad;
529 key_control->flags |= FLOW_DIS_IS_FRAGMENT;
531 nhoff += sizeof(_fh);
532 ip_proto = fh->nexthdr;
534 if (!(fh->frag_off & htons(IP6_OFFSET))) {
535 key_control->flags |= FLOW_DIS_FIRST_FRAG;
536 if (flags & FLOW_DISSECTOR_F_PARSE_1ST_FRAG)
537 goto ip_proto_again;
539 goto out_good;
541 case IPPROTO_IPIP:
542 proto = htons(ETH_P_IP);
544 key_control->flags |= FLOW_DIS_ENCAPSULATION;
545 if (flags & FLOW_DISSECTOR_F_STOP_AT_ENCAP)
546 goto out_good;
548 goto ip;
549 case IPPROTO_IPV6:
550 proto = htons(ETH_P_IPV6);
552 key_control->flags |= FLOW_DIS_ENCAPSULATION;
553 if (flags & FLOW_DISSECTOR_F_STOP_AT_ENCAP)
554 goto out_good;
556 goto ipv6;
557 case IPPROTO_MPLS:
558 proto = htons(ETH_P_MPLS_UC);
559 goto mpls;
560 default:
561 break;
564 if (dissector_uses_key(flow_dissector,
565 FLOW_DISSECTOR_KEY_PORTS)) {
566 key_ports = skb_flow_dissector_target(flow_dissector,
567 FLOW_DISSECTOR_KEY_PORTS,
568 target_container);
569 key_ports->ports = __skb_flow_get_ports(skb, nhoff, ip_proto,
570 data, hlen);
573 if (dissector_uses_key(flow_dissector,
574 FLOW_DISSECTOR_KEY_ICMP)) {
575 key_icmp = skb_flow_dissector_target(flow_dissector,
576 FLOW_DISSECTOR_KEY_ICMP,
577 target_container);
578 key_icmp->icmp = skb_flow_get_be16(skb, nhoff, data, hlen);
581 out_good:
582 ret = true;
584 key_control->thoff = (u16)nhoff;
585 out:
586 key_basic->n_proto = proto;
587 key_basic->ip_proto = ip_proto;
589 return ret;
591 out_bad:
592 ret = false;
593 key_control->thoff = min_t(u16, nhoff, skb ? skb->len : hlen);
594 goto out;
596 EXPORT_SYMBOL(__skb_flow_dissect);
598 static u32 hashrnd __read_mostly;
599 static __always_inline void __flow_hash_secret_init(void)
601 net_get_random_once(&hashrnd, sizeof(hashrnd));
604 static __always_inline u32 __flow_hash_words(const u32 *words, u32 length,
605 u32 keyval)
607 return jhash2(words, length, keyval);
610 static inline const u32 *flow_keys_hash_start(const struct flow_keys *flow)
612 const void *p = flow;
614 BUILD_BUG_ON(FLOW_KEYS_HASH_OFFSET % sizeof(u32));
615 return (const u32 *)(p + FLOW_KEYS_HASH_OFFSET);
618 static inline size_t flow_keys_hash_length(const struct flow_keys *flow)
620 size_t diff = FLOW_KEYS_HASH_OFFSET + sizeof(flow->addrs);
621 BUILD_BUG_ON((sizeof(*flow) - FLOW_KEYS_HASH_OFFSET) % sizeof(u32));
622 BUILD_BUG_ON(offsetof(typeof(*flow), addrs) !=
623 sizeof(*flow) - sizeof(flow->addrs));
625 switch (flow->control.addr_type) {
626 case FLOW_DISSECTOR_KEY_IPV4_ADDRS:
627 diff -= sizeof(flow->addrs.v4addrs);
628 break;
629 case FLOW_DISSECTOR_KEY_IPV6_ADDRS:
630 diff -= sizeof(flow->addrs.v6addrs);
631 break;
632 case FLOW_DISSECTOR_KEY_TIPC_ADDRS:
633 diff -= sizeof(flow->addrs.tipcaddrs);
634 break;
636 return (sizeof(*flow) - diff) / sizeof(u32);
639 __be32 flow_get_u32_src(const struct flow_keys *flow)
641 switch (flow->control.addr_type) {
642 case FLOW_DISSECTOR_KEY_IPV4_ADDRS:
643 return flow->addrs.v4addrs.src;
644 case FLOW_DISSECTOR_KEY_IPV6_ADDRS:
645 return (__force __be32)ipv6_addr_hash(
646 &flow->addrs.v6addrs.src);
647 case FLOW_DISSECTOR_KEY_TIPC_ADDRS:
648 return flow->addrs.tipcaddrs.srcnode;
649 default:
650 return 0;
653 EXPORT_SYMBOL(flow_get_u32_src);
655 __be32 flow_get_u32_dst(const struct flow_keys *flow)
657 switch (flow->control.addr_type) {
658 case FLOW_DISSECTOR_KEY_IPV4_ADDRS:
659 return flow->addrs.v4addrs.dst;
660 case FLOW_DISSECTOR_KEY_IPV6_ADDRS:
661 return (__force __be32)ipv6_addr_hash(
662 &flow->addrs.v6addrs.dst);
663 default:
664 return 0;
667 EXPORT_SYMBOL(flow_get_u32_dst);
669 static inline void __flow_hash_consistentify(struct flow_keys *keys)
671 int addr_diff, i;
673 switch (keys->control.addr_type) {
674 case FLOW_DISSECTOR_KEY_IPV4_ADDRS:
675 addr_diff = (__force u32)keys->addrs.v4addrs.dst -
676 (__force u32)keys->addrs.v4addrs.src;
677 if ((addr_diff < 0) ||
678 (addr_diff == 0 &&
679 ((__force u16)keys->ports.dst <
680 (__force u16)keys->ports.src))) {
681 swap(keys->addrs.v4addrs.src, keys->addrs.v4addrs.dst);
682 swap(keys->ports.src, keys->ports.dst);
684 break;
685 case FLOW_DISSECTOR_KEY_IPV6_ADDRS:
686 addr_diff = memcmp(&keys->addrs.v6addrs.dst,
687 &keys->addrs.v6addrs.src,
688 sizeof(keys->addrs.v6addrs.dst));
689 if ((addr_diff < 0) ||
690 (addr_diff == 0 &&
691 ((__force u16)keys->ports.dst <
692 (__force u16)keys->ports.src))) {
693 for (i = 0; i < 4; i++)
694 swap(keys->addrs.v6addrs.src.s6_addr32[i],
695 keys->addrs.v6addrs.dst.s6_addr32[i]);
696 swap(keys->ports.src, keys->ports.dst);
698 break;
702 static inline u32 __flow_hash_from_keys(struct flow_keys *keys, u32 keyval)
704 u32 hash;
706 __flow_hash_consistentify(keys);
708 hash = __flow_hash_words(flow_keys_hash_start(keys),
709 flow_keys_hash_length(keys), keyval);
710 if (!hash)
711 hash = 1;
713 return hash;
716 u32 flow_hash_from_keys(struct flow_keys *keys)
718 __flow_hash_secret_init();
719 return __flow_hash_from_keys(keys, hashrnd);
721 EXPORT_SYMBOL(flow_hash_from_keys);
723 static inline u32 ___skb_get_hash(const struct sk_buff *skb,
724 struct flow_keys *keys, u32 keyval)
726 skb_flow_dissect_flow_keys(skb, keys,
727 FLOW_DISSECTOR_F_STOP_AT_FLOW_LABEL);
729 return __flow_hash_from_keys(keys, keyval);
732 struct _flow_keys_digest_data {
733 __be16 n_proto;
734 u8 ip_proto;
735 u8 padding;
736 __be32 ports;
737 __be32 src;
738 __be32 dst;
741 void make_flow_keys_digest(struct flow_keys_digest *digest,
742 const struct flow_keys *flow)
744 struct _flow_keys_digest_data *data =
745 (struct _flow_keys_digest_data *)digest;
747 BUILD_BUG_ON(sizeof(*data) > sizeof(*digest));
749 memset(digest, 0, sizeof(*digest));
751 data->n_proto = flow->basic.n_proto;
752 data->ip_proto = flow->basic.ip_proto;
753 data->ports = flow->ports.ports;
754 data->src = flow->addrs.v4addrs.src;
755 data->dst = flow->addrs.v4addrs.dst;
757 EXPORT_SYMBOL(make_flow_keys_digest);
759 static struct flow_dissector flow_keys_dissector_symmetric __read_mostly;
761 u32 __skb_get_hash_symmetric(const struct sk_buff *skb)
763 struct flow_keys keys;
765 __flow_hash_secret_init();
767 memset(&keys, 0, sizeof(keys));
768 __skb_flow_dissect(skb, &flow_keys_dissector_symmetric, &keys,
769 NULL, 0, 0, 0,
770 FLOW_DISSECTOR_F_STOP_AT_FLOW_LABEL);
772 return __flow_hash_from_keys(&keys, hashrnd);
774 EXPORT_SYMBOL_GPL(__skb_get_hash_symmetric);
777 * __skb_get_hash: calculate a flow hash
778 * @skb: sk_buff to calculate flow hash from
780 * This function calculates a flow hash based on src/dst addresses
781 * and src/dst port numbers. Sets hash in skb to non-zero hash value
782 * on success, zero indicates no valid hash. Also, sets l4_hash in skb
783 * if hash is a canonical 4-tuple hash over transport ports.
785 void __skb_get_hash(struct sk_buff *skb)
787 struct flow_keys keys;
788 u32 hash;
790 __flow_hash_secret_init();
792 hash = ___skb_get_hash(skb, &keys, hashrnd);
794 __skb_set_sw_hash(skb, hash, flow_keys_have_l4(&keys));
796 EXPORT_SYMBOL(__skb_get_hash);
798 __u32 skb_get_hash_perturb(const struct sk_buff *skb, u32 perturb)
800 struct flow_keys keys;
802 return ___skb_get_hash(skb, &keys, perturb);
804 EXPORT_SYMBOL(skb_get_hash_perturb);
806 __u32 __skb_get_hash_flowi6(struct sk_buff *skb, const struct flowi6 *fl6)
808 struct flow_keys keys;
810 memset(&keys, 0, sizeof(keys));
812 memcpy(&keys.addrs.v6addrs.src, &fl6->saddr,
813 sizeof(keys.addrs.v6addrs.src));
814 memcpy(&keys.addrs.v6addrs.dst, &fl6->daddr,
815 sizeof(keys.addrs.v6addrs.dst));
816 keys.control.addr_type = FLOW_DISSECTOR_KEY_IPV6_ADDRS;
817 keys.ports.src = fl6->fl6_sport;
818 keys.ports.dst = fl6->fl6_dport;
819 keys.keyid.keyid = fl6->fl6_gre_key;
820 keys.tags.flow_label = (__force u32)fl6->flowlabel;
821 keys.basic.ip_proto = fl6->flowi6_proto;
823 __skb_set_sw_hash(skb, flow_hash_from_keys(&keys),
824 flow_keys_have_l4(&keys));
826 return skb->hash;
828 EXPORT_SYMBOL(__skb_get_hash_flowi6);
830 __u32 __skb_get_hash_flowi4(struct sk_buff *skb, const struct flowi4 *fl4)
832 struct flow_keys keys;
834 memset(&keys, 0, sizeof(keys));
836 keys.addrs.v4addrs.src = fl4->saddr;
837 keys.addrs.v4addrs.dst = fl4->daddr;
838 keys.control.addr_type = FLOW_DISSECTOR_KEY_IPV4_ADDRS;
839 keys.ports.src = fl4->fl4_sport;
840 keys.ports.dst = fl4->fl4_dport;
841 keys.keyid.keyid = fl4->fl4_gre_key;
842 keys.basic.ip_proto = fl4->flowi4_proto;
844 __skb_set_sw_hash(skb, flow_hash_from_keys(&keys),
845 flow_keys_have_l4(&keys));
847 return skb->hash;
849 EXPORT_SYMBOL(__skb_get_hash_flowi4);
851 u32 __skb_get_poff(const struct sk_buff *skb, void *data,
852 const struct flow_keys *keys, int hlen)
854 u32 poff = keys->control.thoff;
856 /* skip L4 headers for fragments after the first */
857 if ((keys->control.flags & FLOW_DIS_IS_FRAGMENT) &&
858 !(keys->control.flags & FLOW_DIS_FIRST_FRAG))
859 return poff;
861 switch (keys->basic.ip_proto) {
862 case IPPROTO_TCP: {
863 /* access doff as u8 to avoid unaligned access */
864 const u8 *doff;
865 u8 _doff;
867 doff = __skb_header_pointer(skb, poff + 12, sizeof(_doff),
868 data, hlen, &_doff);
869 if (!doff)
870 return poff;
872 poff += max_t(u32, sizeof(struct tcphdr), (*doff & 0xF0) >> 2);
873 break;
875 case IPPROTO_UDP:
876 case IPPROTO_UDPLITE:
877 poff += sizeof(struct udphdr);
878 break;
879 /* For the rest, we do not really care about header
880 * extensions at this point for now.
882 case IPPROTO_ICMP:
883 poff += sizeof(struct icmphdr);
884 break;
885 case IPPROTO_ICMPV6:
886 poff += sizeof(struct icmp6hdr);
887 break;
888 case IPPROTO_IGMP:
889 poff += sizeof(struct igmphdr);
890 break;
891 case IPPROTO_DCCP:
892 poff += sizeof(struct dccp_hdr);
893 break;
894 case IPPROTO_SCTP:
895 poff += sizeof(struct sctphdr);
896 break;
899 return poff;
903 * skb_get_poff - get the offset to the payload
904 * @skb: sk_buff to get the payload offset from
906 * The function will get the offset to the payload as far as it could
907 * be dissected. The main user is currently BPF, so that we can dynamically
908 * truncate packets without needing to push actual payload to the user
909 * space and can analyze headers only, instead.
911 u32 skb_get_poff(const struct sk_buff *skb)
913 struct flow_keys keys;
915 if (!skb_flow_dissect_flow_keys(skb, &keys, 0))
916 return 0;
918 return __skb_get_poff(skb, skb->data, &keys, skb_headlen(skb));
921 __u32 __get_hash_from_flowi6(const struct flowi6 *fl6, struct flow_keys *keys)
923 memset(keys, 0, sizeof(*keys));
925 memcpy(&keys->addrs.v6addrs.src, &fl6->saddr,
926 sizeof(keys->addrs.v6addrs.src));
927 memcpy(&keys->addrs.v6addrs.dst, &fl6->daddr,
928 sizeof(keys->addrs.v6addrs.dst));
929 keys->control.addr_type = FLOW_DISSECTOR_KEY_IPV6_ADDRS;
930 keys->ports.src = fl6->fl6_sport;
931 keys->ports.dst = fl6->fl6_dport;
932 keys->keyid.keyid = fl6->fl6_gre_key;
933 keys->tags.flow_label = (__force u32)fl6->flowlabel;
934 keys->basic.ip_proto = fl6->flowi6_proto;
936 return flow_hash_from_keys(keys);
938 EXPORT_SYMBOL(__get_hash_from_flowi6);
940 __u32 __get_hash_from_flowi4(const struct flowi4 *fl4, struct flow_keys *keys)
942 memset(keys, 0, sizeof(*keys));
944 keys->addrs.v4addrs.src = fl4->saddr;
945 keys->addrs.v4addrs.dst = fl4->daddr;
946 keys->control.addr_type = FLOW_DISSECTOR_KEY_IPV4_ADDRS;
947 keys->ports.src = fl4->fl4_sport;
948 keys->ports.dst = fl4->fl4_dport;
949 keys->keyid.keyid = fl4->fl4_gre_key;
950 keys->basic.ip_proto = fl4->flowi4_proto;
952 return flow_hash_from_keys(keys);
954 EXPORT_SYMBOL(__get_hash_from_flowi4);
956 static const struct flow_dissector_key flow_keys_dissector_keys[] = {
958 .key_id = FLOW_DISSECTOR_KEY_CONTROL,
959 .offset = offsetof(struct flow_keys, control),
962 .key_id = FLOW_DISSECTOR_KEY_BASIC,
963 .offset = offsetof(struct flow_keys, basic),
966 .key_id = FLOW_DISSECTOR_KEY_IPV4_ADDRS,
967 .offset = offsetof(struct flow_keys, addrs.v4addrs),
970 .key_id = FLOW_DISSECTOR_KEY_IPV6_ADDRS,
971 .offset = offsetof(struct flow_keys, addrs.v6addrs),
974 .key_id = FLOW_DISSECTOR_KEY_TIPC_ADDRS,
975 .offset = offsetof(struct flow_keys, addrs.tipcaddrs),
978 .key_id = FLOW_DISSECTOR_KEY_PORTS,
979 .offset = offsetof(struct flow_keys, ports),
982 .key_id = FLOW_DISSECTOR_KEY_VLAN,
983 .offset = offsetof(struct flow_keys, vlan),
986 .key_id = FLOW_DISSECTOR_KEY_FLOW_LABEL,
987 .offset = offsetof(struct flow_keys, tags),
990 .key_id = FLOW_DISSECTOR_KEY_GRE_KEYID,
991 .offset = offsetof(struct flow_keys, keyid),
995 static const struct flow_dissector_key flow_keys_dissector_symmetric_keys[] = {
997 .key_id = FLOW_DISSECTOR_KEY_CONTROL,
998 .offset = offsetof(struct flow_keys, control),
1001 .key_id = FLOW_DISSECTOR_KEY_BASIC,
1002 .offset = offsetof(struct flow_keys, basic),
1005 .key_id = FLOW_DISSECTOR_KEY_IPV4_ADDRS,
1006 .offset = offsetof(struct flow_keys, addrs.v4addrs),
1009 .key_id = FLOW_DISSECTOR_KEY_IPV6_ADDRS,
1010 .offset = offsetof(struct flow_keys, addrs.v6addrs),
1013 .key_id = FLOW_DISSECTOR_KEY_PORTS,
1014 .offset = offsetof(struct flow_keys, ports),
1018 static const struct flow_dissector_key flow_keys_buf_dissector_keys[] = {
1020 .key_id = FLOW_DISSECTOR_KEY_CONTROL,
1021 .offset = offsetof(struct flow_keys, control),
1024 .key_id = FLOW_DISSECTOR_KEY_BASIC,
1025 .offset = offsetof(struct flow_keys, basic),
1029 struct flow_dissector flow_keys_dissector __read_mostly;
1030 EXPORT_SYMBOL(flow_keys_dissector);
1032 struct flow_dissector flow_keys_buf_dissector __read_mostly;
1034 static int __init init_default_flow_dissectors(void)
1036 skb_flow_dissector_init(&flow_keys_dissector,
1037 flow_keys_dissector_keys,
1038 ARRAY_SIZE(flow_keys_dissector_keys));
1039 skb_flow_dissector_init(&flow_keys_dissector_symmetric,
1040 flow_keys_dissector_symmetric_keys,
1041 ARRAY_SIZE(flow_keys_dissector_symmetric_keys));
1042 skb_flow_dissector_init(&flow_keys_buf_dissector,
1043 flow_keys_buf_dissector_keys,
1044 ARRAY_SIZE(flow_keys_buf_dissector_keys));
1045 return 0;
1048 core_initcall(init_default_flow_dissectors);