2 * GENEVE: Generic Network Virtualization Encapsulation
4 * Copyright (c) 2015 Red Hat, Inc.
6 * This program is free software; you can redistribute it and/or modify
7 * it under the terms of the GNU General Public License version 2 as
8 * published by the Free Software Foundation.
11 #define pr_fmt(fmt) KBUILD_MODNAME ": " fmt
13 #include <linux/kernel.h>
14 #include <linux/module.h>
15 #include <linux/etherdevice.h>
16 #include <linux/hash.h>
17 #include <net/dst_metadata.h>
18 #include <net/gro_cells.h>
19 #include <net/rtnetlink.h>
20 #include <net/geneve.h>
21 #include <net/protocol.h>
23 #define GENEVE_NETDEV_VER "0.6"
25 #define GENEVE_UDP_PORT 6081
27 #define GENEVE_N_VID (1u << 24)
28 #define GENEVE_VID_MASK (GENEVE_N_VID - 1)
30 #define VNI_HASH_BITS 10
31 #define VNI_HASH_SIZE (1<<VNI_HASH_BITS)
33 static bool log_ecn_error
= true;
34 module_param(log_ecn_error
, bool, 0644);
35 MODULE_PARM_DESC(log_ecn_error
, "Log packets received with corrupted ECN");
38 #define GENEVE_BASE_HLEN (sizeof(struct udphdr) + sizeof(struct genevehdr))
40 /* per-network namespace private data for this module */
42 struct list_head geneve_list
;
43 struct list_head sock_list
;
46 static int geneve_net_id
;
49 struct sockaddr_in sin
;
50 struct sockaddr_in6 sin6
;
54 static union geneve_addr geneve_remote_unspec
= { .sa
.sa_family
= AF_UNSPEC
, };
56 /* Pseudo network device */
58 struct hlist_node hlist
; /* vni hash table */
59 struct net
*net
; /* netns for packet i/o */
60 struct net_device
*dev
; /* netdev for geneve tunnel */
61 struct geneve_sock __rcu
*sock4
; /* IPv4 socket used for geneve tunnel */
62 #if IS_ENABLED(CONFIG_IPV6)
63 struct geneve_sock __rcu
*sock6
; /* IPv6 socket used for geneve tunnel */
65 u8 vni
[3]; /* virtual network ID for tunnel */
66 u8 ttl
; /* TTL override */
67 u8 tos
; /* TOS override */
68 union geneve_addr remote
; /* IP address for link partner */
69 struct list_head next
; /* geneve's per namespace list */
70 __be32 label
; /* IPv6 flowlabel override */
73 struct gro_cells gro_cells
;
75 struct dst_cache dst_cache
;
78 /* Geneve device flags */
79 #define GENEVE_F_UDP_ZERO_CSUM_TX BIT(0)
80 #define GENEVE_F_UDP_ZERO_CSUM6_TX BIT(1)
81 #define GENEVE_F_UDP_ZERO_CSUM6_RX BIT(2)
85 struct list_head list
;
89 struct hlist_head vni_list
[VNI_HASH_SIZE
];
93 static inline __u32
geneve_net_vni_hash(u8 vni
[3])
97 vnid
= (vni
[0] << 16) | (vni
[1] << 8) | vni
[2];
98 return hash_32(vnid
, VNI_HASH_BITS
);
101 static __be64
vni_to_tunnel_id(const __u8
*vni
)
104 return (vni
[0] << 16) | (vni
[1] << 8) | vni
[2];
106 return (__force __be64
)(((__force u64
)vni
[0] << 40) |
107 ((__force u64
)vni
[1] << 48) |
108 ((__force u64
)vni
[2] << 56));
112 static sa_family_t
geneve_get_sk_family(struct geneve_sock
*gs
)
114 return gs
->sock
->sk
->sk_family
;
117 static struct geneve_dev
*geneve_lookup(struct geneve_sock
*gs
,
118 __be32 addr
, u8 vni
[])
120 struct hlist_head
*vni_list_head
;
121 struct geneve_dev
*geneve
;
124 /* Find the device for this VNI */
125 hash
= geneve_net_vni_hash(vni
);
126 vni_list_head
= &gs
->vni_list
[hash
];
127 hlist_for_each_entry_rcu(geneve
, vni_list_head
, hlist
) {
128 if (!memcmp(vni
, geneve
->vni
, sizeof(geneve
->vni
)) &&
129 addr
== geneve
->remote
.sin
.sin_addr
.s_addr
)
135 #if IS_ENABLED(CONFIG_IPV6)
136 static struct geneve_dev
*geneve6_lookup(struct geneve_sock
*gs
,
137 struct in6_addr addr6
, u8 vni
[])
139 struct hlist_head
*vni_list_head
;
140 struct geneve_dev
*geneve
;
143 /* Find the device for this VNI */
144 hash
= geneve_net_vni_hash(vni
);
145 vni_list_head
= &gs
->vni_list
[hash
];
146 hlist_for_each_entry_rcu(geneve
, vni_list_head
, hlist
) {
147 if (!memcmp(vni
, geneve
->vni
, sizeof(geneve
->vni
)) &&
148 ipv6_addr_equal(&addr6
, &geneve
->remote
.sin6
.sin6_addr
))
155 static inline struct genevehdr
*geneve_hdr(const struct sk_buff
*skb
)
157 return (struct genevehdr
*)(udp_hdr(skb
) + 1);
160 static struct geneve_dev
*geneve_lookup_skb(struct geneve_sock
*gs
,
165 static u8 zero_vni
[3];
166 #if IS_ENABLED(CONFIG_IPV6)
167 static struct in6_addr zero_addr6
;
170 if (geneve_get_sk_family(gs
) == AF_INET
) {
173 iph
= ip_hdr(skb
); /* outer IP header... */
175 if (gs
->collect_md
) {
179 vni
= geneve_hdr(skb
)->vni
;
183 return geneve_lookup(gs
, addr
, vni
);
184 #if IS_ENABLED(CONFIG_IPV6)
185 } else if (geneve_get_sk_family(gs
) == AF_INET6
) {
186 struct ipv6hdr
*ip6h
;
187 struct in6_addr addr6
;
189 ip6h
= ipv6_hdr(skb
); /* outer IPv6 header... */
191 if (gs
->collect_md
) {
195 vni
= geneve_hdr(skb
)->vni
;
199 return geneve6_lookup(gs
, addr6
, vni
);
205 /* geneve receive/decap routine */
206 static void geneve_rx(struct geneve_dev
*geneve
, struct geneve_sock
*gs
,
209 struct genevehdr
*gnvh
= geneve_hdr(skb
);
210 struct metadata_dst
*tun_dst
= NULL
;
211 struct pcpu_sw_netstats
*stats
;
216 if (ip_tunnel_collect_metadata() || gs
->collect_md
) {
219 flags
= TUNNEL_KEY
| TUNNEL_GENEVE_OPT
|
220 (gnvh
->oam
? TUNNEL_OAM
: 0) |
221 (gnvh
->critical
? TUNNEL_CRIT_OPT
: 0);
223 tun_dst
= udp_tun_rx_dst(skb
, geneve_get_sk_family(gs
), flags
,
224 vni_to_tunnel_id(gnvh
->vni
),
227 geneve
->dev
->stats
.rx_dropped
++;
230 /* Update tunnel dst according to Geneve options. */
231 ip_tunnel_info_opts_set(&tun_dst
->u
.tun_info
,
232 gnvh
->options
, gnvh
->opt_len
* 4);
234 /* Drop packets w/ critical options,
235 * since we don't support any...
237 if (gnvh
->critical
) {
238 geneve
->dev
->stats
.rx_frame_errors
++;
239 geneve
->dev
->stats
.rx_errors
++;
244 skb_reset_mac_header(skb
);
245 skb
->protocol
= eth_type_trans(skb
, geneve
->dev
);
246 skb_postpull_rcsum(skb
, eth_hdr(skb
), ETH_HLEN
);
249 skb_dst_set(skb
, &tun_dst
->dst
);
251 /* Ignore packet loops (and multicast echo) */
252 if (ether_addr_equal(eth_hdr(skb
)->h_source
, geneve
->dev
->dev_addr
)) {
253 geneve
->dev
->stats
.rx_errors
++;
257 oiph
= skb_network_header(skb
);
258 skb_reset_network_header(skb
);
260 if (geneve_get_sk_family(gs
) == AF_INET
)
261 err
= IP_ECN_decapsulate(oiph
, skb
);
262 #if IS_ENABLED(CONFIG_IPV6)
264 err
= IP6_ECN_decapsulate(oiph
, skb
);
269 if (geneve_get_sk_family(gs
) == AF_INET
)
270 net_info_ratelimited("non-ECT from %pI4 "
272 &((struct iphdr
*)oiph
)->saddr
,
273 ((struct iphdr
*)oiph
)->tos
);
274 #if IS_ENABLED(CONFIG_IPV6)
276 net_info_ratelimited("non-ECT from %pI6\n",
277 &((struct ipv6hdr
*)oiph
)->saddr
);
281 ++geneve
->dev
->stats
.rx_frame_errors
;
282 ++geneve
->dev
->stats
.rx_errors
;
288 err
= gro_cells_receive(&geneve
->gro_cells
, skb
);
289 if (likely(err
== NET_RX_SUCCESS
)) {
290 stats
= this_cpu_ptr(geneve
->dev
->tstats
);
291 u64_stats_update_begin(&stats
->syncp
);
293 stats
->rx_bytes
+= len
;
294 u64_stats_update_end(&stats
->syncp
);
298 /* Consume bad packet */
302 /* Setup stats when device is created */
303 static int geneve_init(struct net_device
*dev
)
305 struct geneve_dev
*geneve
= netdev_priv(dev
);
308 dev
->tstats
= netdev_alloc_pcpu_stats(struct pcpu_sw_netstats
);
312 err
= gro_cells_init(&geneve
->gro_cells
, dev
);
314 free_percpu(dev
->tstats
);
318 err
= dst_cache_init(&geneve
->dst_cache
, GFP_KERNEL
);
320 free_percpu(dev
->tstats
);
321 gro_cells_destroy(&geneve
->gro_cells
);
328 static void geneve_uninit(struct net_device
*dev
)
330 struct geneve_dev
*geneve
= netdev_priv(dev
);
332 dst_cache_destroy(&geneve
->dst_cache
);
333 gro_cells_destroy(&geneve
->gro_cells
);
334 free_percpu(dev
->tstats
);
337 /* Callback from net/ipv4/udp.c to receive packets */
338 static int geneve_udp_encap_recv(struct sock
*sk
, struct sk_buff
*skb
)
340 struct genevehdr
*geneveh
;
341 struct geneve_dev
*geneve
;
342 struct geneve_sock
*gs
;
345 /* Need UDP and Geneve header to be present */
346 if (unlikely(!pskb_may_pull(skb
, GENEVE_BASE_HLEN
)))
349 /* Return packets with reserved bits set */
350 geneveh
= geneve_hdr(skb
);
351 if (unlikely(geneveh
->ver
!= GENEVE_VER
))
354 if (unlikely(geneveh
->proto_type
!= htons(ETH_P_TEB
)))
357 gs
= rcu_dereference_sk_user_data(sk
);
361 geneve
= geneve_lookup_skb(gs
, skb
);
365 opts_len
= geneveh
->opt_len
* 4;
366 if (iptunnel_pull_header(skb
, GENEVE_BASE_HLEN
+ opts_len
,
368 !net_eq(geneve
->net
, dev_net(geneve
->dev
)))) {
369 geneve
->dev
->stats
.rx_dropped
++;
373 geneve_rx(geneve
, gs
, skb
);
377 /* Consume bad packet */
382 static struct socket
*geneve_create_sock(struct net
*net
, bool ipv6
,
383 __be16 port
, u32 flags
)
386 struct udp_port_cfg udp_conf
;
389 memset(&udp_conf
, 0, sizeof(udp_conf
));
392 udp_conf
.family
= AF_INET6
;
393 udp_conf
.ipv6_v6only
= 1;
394 udp_conf
.use_udp6_rx_checksums
=
395 !(flags
& GENEVE_F_UDP_ZERO_CSUM6_RX
);
397 udp_conf
.family
= AF_INET
;
398 udp_conf
.local_ip
.s_addr
= htonl(INADDR_ANY
);
401 udp_conf
.local_udp_port
= port
;
403 /* Open UDP socket */
404 err
= udp_sock_create(net
, &udp_conf
, &sock
);
411 static int geneve_hlen(struct genevehdr
*gh
)
413 return sizeof(*gh
) + gh
->opt_len
* 4;
416 static struct sk_buff
**geneve_gro_receive(struct sock
*sk
,
417 struct sk_buff
**head
,
420 struct sk_buff
*p
, **pp
= NULL
;
421 struct genevehdr
*gh
, *gh2
;
422 unsigned int hlen
, gh_len
, off_gnv
;
423 const struct packet_offload
*ptype
;
427 off_gnv
= skb_gro_offset(skb
);
428 hlen
= off_gnv
+ sizeof(*gh
);
429 gh
= skb_gro_header_fast(skb
, off_gnv
);
430 if (skb_gro_header_hard(skb
, hlen
)) {
431 gh
= skb_gro_header_slow(skb
, hlen
, off_gnv
);
436 if (gh
->ver
!= GENEVE_VER
|| gh
->oam
)
438 gh_len
= geneve_hlen(gh
);
440 hlen
= off_gnv
+ gh_len
;
441 if (skb_gro_header_hard(skb
, hlen
)) {
442 gh
= skb_gro_header_slow(skb
, hlen
, off_gnv
);
447 for (p
= *head
; p
; p
= p
->next
) {
448 if (!NAPI_GRO_CB(p
)->same_flow
)
451 gh2
= (struct genevehdr
*)(p
->data
+ off_gnv
);
452 if (gh
->opt_len
!= gh2
->opt_len
||
453 memcmp(gh
, gh2
, gh_len
)) {
454 NAPI_GRO_CB(p
)->same_flow
= 0;
459 type
= gh
->proto_type
;
462 ptype
= gro_find_receive_by_type(type
);
466 skb_gro_pull(skb
, gh_len
);
467 skb_gro_postpull_rcsum(skb
, gh
, gh_len
);
468 pp
= call_gro_receive(ptype
->callbacks
.gro_receive
, head
, skb
);
474 NAPI_GRO_CB(skb
)->flush
|= flush
;
479 static int geneve_gro_complete(struct sock
*sk
, struct sk_buff
*skb
,
482 struct genevehdr
*gh
;
483 struct packet_offload
*ptype
;
488 gh
= (struct genevehdr
*)(skb
->data
+ nhoff
);
489 gh_len
= geneve_hlen(gh
);
490 type
= gh
->proto_type
;
493 ptype
= gro_find_complete_by_type(type
);
495 err
= ptype
->callbacks
.gro_complete(skb
, nhoff
+ gh_len
);
499 skb_set_inner_mac_header(skb
, nhoff
+ gh_len
);
504 /* Create new listen socket if needed */
505 static struct geneve_sock
*geneve_socket_create(struct net
*net
, __be16 port
,
506 bool ipv6
, u32 flags
)
508 struct geneve_net
*gn
= net_generic(net
, geneve_net_id
);
509 struct geneve_sock
*gs
;
511 struct udp_tunnel_sock_cfg tunnel_cfg
;
514 gs
= kzalloc(sizeof(*gs
), GFP_KERNEL
);
516 return ERR_PTR(-ENOMEM
);
518 sock
= geneve_create_sock(net
, ipv6
, port
, flags
);
521 return ERR_CAST(sock
);
526 for (h
= 0; h
< VNI_HASH_SIZE
; ++h
)
527 INIT_HLIST_HEAD(&gs
->vni_list
[h
]);
529 /* Initialize the geneve udp offloads structure */
530 udp_tunnel_notify_add_rx_port(gs
->sock
, UDP_TUNNEL_TYPE_GENEVE
);
532 /* Mark socket as an encapsulation socket */
533 memset(&tunnel_cfg
, 0, sizeof(tunnel_cfg
));
534 tunnel_cfg
.sk_user_data
= gs
;
535 tunnel_cfg
.encap_type
= 1;
536 tunnel_cfg
.gro_receive
= geneve_gro_receive
;
537 tunnel_cfg
.gro_complete
= geneve_gro_complete
;
538 tunnel_cfg
.encap_rcv
= geneve_udp_encap_recv
;
539 tunnel_cfg
.encap_destroy
= NULL
;
540 setup_udp_tunnel_sock(net
, sock
, &tunnel_cfg
);
541 list_add(&gs
->list
, &gn
->sock_list
);
545 static void __geneve_sock_release(struct geneve_sock
*gs
)
547 if (!gs
|| --gs
->refcnt
)
551 udp_tunnel_notify_del_rx_port(gs
->sock
, UDP_TUNNEL_TYPE_GENEVE
);
552 udp_tunnel_sock_release(gs
->sock
);
556 static void geneve_sock_release(struct geneve_dev
*geneve
)
558 struct geneve_sock
*gs4
= rtnl_dereference(geneve
->sock4
);
559 #if IS_ENABLED(CONFIG_IPV6)
560 struct geneve_sock
*gs6
= rtnl_dereference(geneve
->sock6
);
562 rcu_assign_pointer(geneve
->sock6
, NULL
);
565 rcu_assign_pointer(geneve
->sock4
, NULL
);
568 __geneve_sock_release(gs4
);
569 #if IS_ENABLED(CONFIG_IPV6)
570 __geneve_sock_release(gs6
);
574 static struct geneve_sock
*geneve_find_sock(struct geneve_net
*gn
,
578 struct geneve_sock
*gs
;
580 list_for_each_entry(gs
, &gn
->sock_list
, list
) {
581 if (inet_sk(gs
->sock
->sk
)->inet_sport
== dst_port
&&
582 geneve_get_sk_family(gs
) == family
) {
589 static int geneve_sock_add(struct geneve_dev
*geneve
, bool ipv6
)
591 struct net
*net
= geneve
->net
;
592 struct geneve_net
*gn
= net_generic(net
, geneve_net_id
);
593 struct geneve_sock
*gs
;
596 gs
= geneve_find_sock(gn
, ipv6
? AF_INET6
: AF_INET
, geneve
->dst_port
);
602 gs
= geneve_socket_create(net
, geneve
->dst_port
, ipv6
, geneve
->flags
);
607 gs
->collect_md
= geneve
->collect_md
;
608 gs
->flags
= geneve
->flags
;
609 #if IS_ENABLED(CONFIG_IPV6)
611 rcu_assign_pointer(geneve
->sock6
, gs
);
614 rcu_assign_pointer(geneve
->sock4
, gs
);
616 hash
= geneve_net_vni_hash(geneve
->vni
);
617 hlist_add_head_rcu(&geneve
->hlist
, &gs
->vni_list
[hash
]);
621 static int geneve_open(struct net_device
*dev
)
623 struct geneve_dev
*geneve
= netdev_priv(dev
);
624 bool ipv6
= geneve
->remote
.sa
.sa_family
== AF_INET6
;
625 bool metadata
= geneve
->collect_md
;
628 #if IS_ENABLED(CONFIG_IPV6)
629 if (ipv6
|| metadata
)
630 ret
= geneve_sock_add(geneve
, true);
632 if (!ret
&& (!ipv6
|| metadata
))
633 ret
= geneve_sock_add(geneve
, false);
635 geneve_sock_release(geneve
);
640 static int geneve_stop(struct net_device
*dev
)
642 struct geneve_dev
*geneve
= netdev_priv(dev
);
644 if (!hlist_unhashed(&geneve
->hlist
))
645 hlist_del_rcu(&geneve
->hlist
);
646 geneve_sock_release(geneve
);
650 static void geneve_build_header(struct genevehdr
*geneveh
,
651 __be16 tun_flags
, u8 vni
[3],
652 u8 options_len
, u8
*options
)
654 geneveh
->ver
= GENEVE_VER
;
655 geneveh
->opt_len
= options_len
/ 4;
656 geneveh
->oam
= !!(tun_flags
& TUNNEL_OAM
);
657 geneveh
->critical
= !!(tun_flags
& TUNNEL_CRIT_OPT
);
659 memcpy(geneveh
->vni
, vni
, 3);
660 geneveh
->proto_type
= htons(ETH_P_TEB
);
663 memcpy(geneveh
->options
, options
, options_len
);
666 static int geneve_build_skb(struct rtable
*rt
, struct sk_buff
*skb
,
667 __be16 tun_flags
, u8 vni
[3], u8 opt_len
, u8
*opt
,
668 u32 flags
, bool xnet
)
670 struct genevehdr
*gnvh
;
673 bool udp_sum
= !(flags
& GENEVE_F_UDP_ZERO_CSUM_TX
);
675 skb_scrub_packet(skb
, xnet
);
677 min_headroom
= LL_RESERVED_SPACE(rt
->dst
.dev
) + rt
->dst
.header_len
678 + GENEVE_BASE_HLEN
+ opt_len
+ sizeof(struct iphdr
);
679 err
= skb_cow_head(skb
, min_headroom
);
683 err
= udp_tunnel_handle_offloads(skb
, udp_sum
);
687 gnvh
= (struct genevehdr
*)__skb_push(skb
, sizeof(*gnvh
) + opt_len
);
688 geneve_build_header(gnvh
, tun_flags
, vni
, opt_len
, opt
);
690 skb_set_inner_protocol(skb
, htons(ETH_P_TEB
));
698 #if IS_ENABLED(CONFIG_IPV6)
699 static int geneve6_build_skb(struct dst_entry
*dst
, struct sk_buff
*skb
,
700 __be16 tun_flags
, u8 vni
[3], u8 opt_len
, u8
*opt
,
701 u32 flags
, bool xnet
)
703 struct genevehdr
*gnvh
;
706 bool udp_sum
= !(flags
& GENEVE_F_UDP_ZERO_CSUM6_TX
);
708 skb_scrub_packet(skb
, xnet
);
710 min_headroom
= LL_RESERVED_SPACE(dst
->dev
) + dst
->header_len
711 + GENEVE_BASE_HLEN
+ opt_len
+ sizeof(struct ipv6hdr
);
712 err
= skb_cow_head(skb
, min_headroom
);
716 err
= udp_tunnel_handle_offloads(skb
, udp_sum
);
720 gnvh
= (struct genevehdr
*)__skb_push(skb
, sizeof(*gnvh
) + opt_len
);
721 geneve_build_header(gnvh
, tun_flags
, vni
, opt_len
, opt
);
723 skb_set_inner_protocol(skb
, htons(ETH_P_TEB
));
732 static struct rtable
*geneve_get_v4_rt(struct sk_buff
*skb
,
733 struct net_device
*dev
,
735 struct ip_tunnel_info
*info
)
737 bool use_cache
= ip_tunnel_dst_cache_usable(skb
, info
);
738 struct geneve_dev
*geneve
= netdev_priv(dev
);
739 struct dst_cache
*dst_cache
;
740 struct rtable
*rt
= NULL
;
743 if (!rcu_dereference(geneve
->sock4
))
744 return ERR_PTR(-EIO
);
746 memset(fl4
, 0, sizeof(*fl4
));
747 fl4
->flowi4_mark
= skb
->mark
;
748 fl4
->flowi4_proto
= IPPROTO_UDP
;
751 fl4
->daddr
= info
->key
.u
.ipv4
.dst
;
752 fl4
->saddr
= info
->key
.u
.ipv4
.src
;
753 fl4
->flowi4_tos
= RT_TOS(info
->key
.tos
);
754 dst_cache
= &info
->dst_cache
;
758 const struct iphdr
*iip
= ip_hdr(skb
);
760 tos
= ip_tunnel_get_dsfield(iip
, skb
);
764 fl4
->flowi4_tos
= RT_TOS(tos
);
765 fl4
->daddr
= geneve
->remote
.sin
.sin_addr
.s_addr
;
766 dst_cache
= &geneve
->dst_cache
;
770 rt
= dst_cache_get_ip4(dst_cache
, &fl4
->saddr
);
775 rt
= ip_route_output_key(geneve
->net
, fl4
);
777 netdev_dbg(dev
, "no route to %pI4\n", &fl4
->daddr
);
778 return ERR_PTR(-ENETUNREACH
);
780 if (rt
->dst
.dev
== dev
) { /* is this necessary? */
781 netdev_dbg(dev
, "circular route to %pI4\n", &fl4
->daddr
);
783 return ERR_PTR(-ELOOP
);
786 dst_cache_set_ip4(dst_cache
, &rt
->dst
, fl4
->saddr
);
790 #if IS_ENABLED(CONFIG_IPV6)
791 static struct dst_entry
*geneve_get_v6_dst(struct sk_buff
*skb
,
792 struct net_device
*dev
,
794 struct ip_tunnel_info
*info
)
796 bool use_cache
= ip_tunnel_dst_cache_usable(skb
, info
);
797 struct geneve_dev
*geneve
= netdev_priv(dev
);
798 struct dst_entry
*dst
= NULL
;
799 struct dst_cache
*dst_cache
;
800 struct geneve_sock
*gs6
;
803 gs6
= rcu_dereference(geneve
->sock6
);
805 return ERR_PTR(-EIO
);
807 memset(fl6
, 0, sizeof(*fl6
));
808 fl6
->flowi6_mark
= skb
->mark
;
809 fl6
->flowi6_proto
= IPPROTO_UDP
;
812 fl6
->daddr
= info
->key
.u
.ipv6
.dst
;
813 fl6
->saddr
= info
->key
.u
.ipv6
.src
;
814 fl6
->flowlabel
= ip6_make_flowinfo(RT_TOS(info
->key
.tos
),
816 dst_cache
= &info
->dst_cache
;
820 const struct iphdr
*iip
= ip_hdr(skb
);
822 prio
= ip_tunnel_get_dsfield(iip
, skb
);
826 fl6
->flowlabel
= ip6_make_flowinfo(RT_TOS(prio
),
828 fl6
->daddr
= geneve
->remote
.sin6
.sin6_addr
;
829 dst_cache
= &geneve
->dst_cache
;
833 dst
= dst_cache_get_ip6(dst_cache
, &fl6
->saddr
);
838 if (ipv6_stub
->ipv6_dst_lookup(geneve
->net
, gs6
->sock
->sk
, &dst
, fl6
)) {
839 netdev_dbg(dev
, "no route to %pI6\n", &fl6
->daddr
);
840 return ERR_PTR(-ENETUNREACH
);
842 if (dst
->dev
== dev
) { /* is this necessary? */
843 netdev_dbg(dev
, "circular route to %pI6\n", &fl6
->daddr
);
845 return ERR_PTR(-ELOOP
);
849 dst_cache_set_ip6(dst_cache
, dst
, &fl6
->saddr
);
854 /* Convert 64 bit tunnel ID to 24 bit VNI. */
855 static void tunnel_id_to_vni(__be64 tun_id
, __u8
*vni
)
858 vni
[0] = (__force __u8
)(tun_id
>> 16);
859 vni
[1] = (__force __u8
)(tun_id
>> 8);
860 vni
[2] = (__force __u8
)tun_id
;
862 vni
[0] = (__force __u8
)((__force u64
)tun_id
>> 40);
863 vni
[1] = (__force __u8
)((__force u64
)tun_id
>> 48);
864 vni
[2] = (__force __u8
)((__force u64
)tun_id
>> 56);
868 static netdev_tx_t
geneve_xmit_skb(struct sk_buff
*skb
, struct net_device
*dev
,
869 struct ip_tunnel_info
*info
)
871 struct geneve_dev
*geneve
= netdev_priv(dev
);
872 struct geneve_sock
*gs4
;
873 struct rtable
*rt
= NULL
;
879 bool xnet
= !net_eq(geneve
->net
, dev_net(geneve
->dev
));
880 u32 flags
= geneve
->flags
;
882 gs4
= rcu_dereference(geneve
->sock4
);
886 if (geneve
->collect_md
) {
887 if (unlikely(!info
|| !(info
->mode
& IP_TUNNEL_INFO_TX
))) {
888 netdev_dbg(dev
, "no tunnel metadata\n");
891 if (info
&& ip_tunnel_info_af(info
) != AF_INET
)
895 rt
= geneve_get_v4_rt(skb
, dev
, &fl4
, info
);
901 sport
= udp_flow_src_port(geneve
->net
, skb
, 1, USHRT_MAX
, true);
902 skb_reset_mac_header(skb
);
905 const struct ip_tunnel_key
*key
= &info
->key
;
909 tunnel_id_to_vni(key
->tun_id
, vni
);
910 if (info
->options_len
)
911 opts
= ip_tunnel_info_opts(info
);
913 if (key
->tun_flags
& TUNNEL_CSUM
)
914 flags
&= ~GENEVE_F_UDP_ZERO_CSUM_TX
;
916 flags
|= GENEVE_F_UDP_ZERO_CSUM_TX
;
918 err
= geneve_build_skb(rt
, skb
, key
->tun_flags
, vni
,
919 info
->options_len
, opts
, flags
, xnet
);
923 tos
= ip_tunnel_ecn_encap(key
->tos
, ip_hdr(skb
), skb
);
925 df
= key
->tun_flags
& TUNNEL_DONT_FRAGMENT
? htons(IP_DF
) : 0;
927 err
= geneve_build_skb(rt
, skb
, 0, geneve
->vni
,
928 0, NULL
, flags
, xnet
);
932 tos
= ip_tunnel_ecn_encap(fl4
.flowi4_tos
, ip_hdr(skb
), skb
);
934 if (!ttl
&& IN_MULTICAST(ntohl(fl4
.daddr
)))
936 ttl
= ttl
? : ip4_dst_hoplimit(&rt
->dst
);
939 udp_tunnel_xmit_skb(rt
, gs4
->sock
->sk
, skb
, fl4
.saddr
, fl4
.daddr
,
940 tos
, ttl
, df
, sport
, geneve
->dst_port
,
941 !net_eq(geneve
->net
, dev_net(geneve
->dev
)),
942 !!(flags
& GENEVE_F_UDP_ZERO_CSUM_TX
));
950 dev
->stats
.collisions
++;
951 else if (err
== -ENETUNREACH
)
952 dev
->stats
.tx_carrier_errors
++;
954 dev
->stats
.tx_errors
++;
958 #if IS_ENABLED(CONFIG_IPV6)
959 static netdev_tx_t
geneve6_xmit_skb(struct sk_buff
*skb
, struct net_device
*dev
,
960 struct ip_tunnel_info
*info
)
962 struct geneve_dev
*geneve
= netdev_priv(dev
);
963 struct dst_entry
*dst
= NULL
;
964 struct geneve_sock
*gs6
;
970 bool xnet
= !net_eq(geneve
->net
, dev_net(geneve
->dev
));
971 u32 flags
= geneve
->flags
;
973 gs6
= rcu_dereference(geneve
->sock6
);
977 if (geneve
->collect_md
) {
978 if (unlikely(!info
|| !(info
->mode
& IP_TUNNEL_INFO_TX
))) {
979 netdev_dbg(dev
, "no tunnel metadata\n");
984 dst
= geneve_get_v6_dst(skb
, dev
, &fl6
, info
);
990 sport
= udp_flow_src_port(geneve
->net
, skb
, 1, USHRT_MAX
, true);
991 skb_reset_mac_header(skb
);
994 const struct ip_tunnel_key
*key
= &info
->key
;
998 tunnel_id_to_vni(key
->tun_id
, vni
);
999 if (info
->options_len
)
1000 opts
= ip_tunnel_info_opts(info
);
1002 if (key
->tun_flags
& TUNNEL_CSUM
)
1003 flags
&= ~GENEVE_F_UDP_ZERO_CSUM6_TX
;
1005 flags
|= GENEVE_F_UDP_ZERO_CSUM6_TX
;
1007 err
= geneve6_build_skb(dst
, skb
, key
->tun_flags
, vni
,
1008 info
->options_len
, opts
,
1013 prio
= ip_tunnel_ecn_encap(key
->tos
, ip_hdr(skb
), skb
);
1015 label
= info
->key
.label
;
1017 err
= geneve6_build_skb(dst
, skb
, 0, geneve
->vni
,
1018 0, NULL
, flags
, xnet
);
1022 prio
= ip_tunnel_ecn_encap(ip6_tclass(fl6
.flowlabel
),
1025 if (!ttl
&& ipv6_addr_is_multicast(&fl6
.daddr
))
1027 ttl
= ttl
? : ip6_dst_hoplimit(dst
);
1028 label
= geneve
->label
;
1031 udp_tunnel6_xmit_skb(dst
, gs6
->sock
->sk
, skb
, dev
,
1032 &fl6
.saddr
, &fl6
.daddr
, prio
, ttl
, label
,
1033 sport
, geneve
->dst_port
,
1034 !!(flags
& GENEVE_F_UDP_ZERO_CSUM6_TX
));
1035 return NETDEV_TX_OK
;
1041 dev
->stats
.collisions
++;
1042 else if (err
== -ENETUNREACH
)
1043 dev
->stats
.tx_carrier_errors
++;
1045 dev
->stats
.tx_errors
++;
1046 return NETDEV_TX_OK
;
1050 static netdev_tx_t
geneve_xmit(struct sk_buff
*skb
, struct net_device
*dev
)
1052 struct geneve_dev
*geneve
= netdev_priv(dev
);
1053 struct ip_tunnel_info
*info
= NULL
;
1056 if (geneve
->collect_md
)
1057 info
= skb_tunnel_info(skb
);
1060 #if IS_ENABLED(CONFIG_IPV6)
1061 if ((info
&& ip_tunnel_info_af(info
) == AF_INET6
) ||
1062 (!info
&& geneve
->remote
.sa
.sa_family
== AF_INET6
))
1063 err
= geneve6_xmit_skb(skb
, dev
, info
);
1066 err
= geneve_xmit_skb(skb
, dev
, info
);
1072 static int __geneve_change_mtu(struct net_device
*dev
, int new_mtu
, bool strict
)
1074 struct geneve_dev
*geneve
= netdev_priv(dev
);
1075 /* The max_mtu calculation does not take account of GENEVE
1076 * options, to avoid excluding potentially valid
1079 int max_mtu
= IP_MAX_MTU
- GENEVE_BASE_HLEN
- dev
->hard_header_len
;
1081 if (geneve
->remote
.sa
.sa_family
== AF_INET6
)
1082 max_mtu
-= sizeof(struct ipv6hdr
);
1084 max_mtu
-= sizeof(struct iphdr
);
1089 if (new_mtu
> max_mtu
) {
1100 static int geneve_change_mtu(struct net_device
*dev
, int new_mtu
)
1102 return __geneve_change_mtu(dev
, new_mtu
, true);
1105 static int geneve_fill_metadata_dst(struct net_device
*dev
, struct sk_buff
*skb
)
1107 struct ip_tunnel_info
*info
= skb_tunnel_info(skb
);
1108 struct geneve_dev
*geneve
= netdev_priv(dev
);
1111 #if IS_ENABLED(CONFIG_IPV6)
1112 struct dst_entry
*dst
;
1116 if (ip_tunnel_info_af(info
) == AF_INET
) {
1117 rt
= geneve_get_v4_rt(skb
, dev
, &fl4
, info
);
1122 info
->key
.u
.ipv4
.src
= fl4
.saddr
;
1123 #if IS_ENABLED(CONFIG_IPV6)
1124 } else if (ip_tunnel_info_af(info
) == AF_INET6
) {
1125 dst
= geneve_get_v6_dst(skb
, dev
, &fl6
, info
);
1127 return PTR_ERR(dst
);
1130 info
->key
.u
.ipv6
.src
= fl6
.saddr
;
1136 info
->key
.tp_src
= udp_flow_src_port(geneve
->net
, skb
,
1137 1, USHRT_MAX
, true);
1138 info
->key
.tp_dst
= geneve
->dst_port
;
1142 static const struct net_device_ops geneve_netdev_ops
= {
1143 .ndo_init
= geneve_init
,
1144 .ndo_uninit
= geneve_uninit
,
1145 .ndo_open
= geneve_open
,
1146 .ndo_stop
= geneve_stop
,
1147 .ndo_start_xmit
= geneve_xmit
,
1148 .ndo_get_stats64
= ip_tunnel_get_stats64
,
1149 .ndo_change_mtu
= geneve_change_mtu
,
1150 .ndo_validate_addr
= eth_validate_addr
,
1151 .ndo_set_mac_address
= eth_mac_addr
,
1152 .ndo_fill_metadata_dst
= geneve_fill_metadata_dst
,
1155 static void geneve_get_drvinfo(struct net_device
*dev
,
1156 struct ethtool_drvinfo
*drvinfo
)
1158 strlcpy(drvinfo
->version
, GENEVE_NETDEV_VER
, sizeof(drvinfo
->version
));
1159 strlcpy(drvinfo
->driver
, "geneve", sizeof(drvinfo
->driver
));
1162 static const struct ethtool_ops geneve_ethtool_ops
= {
1163 .get_drvinfo
= geneve_get_drvinfo
,
1164 .get_link
= ethtool_op_get_link
,
1167 /* Info for udev, that this is a virtual tunnel endpoint */
1168 static struct device_type geneve_type
= {
1172 /* Calls the ndo_udp_tunnel_add of the caller in order to
1173 * supply the listening GENEVE udp ports. Callers are expected
1174 * to implement the ndo_udp_tunnel_add.
1176 static void geneve_push_rx_ports(struct net_device
*dev
)
1178 struct net
*net
= dev_net(dev
);
1179 struct geneve_net
*gn
= net_generic(net
, geneve_net_id
);
1180 struct geneve_sock
*gs
;
1183 list_for_each_entry_rcu(gs
, &gn
->sock_list
, list
)
1184 udp_tunnel_push_rx_port(dev
, gs
->sock
,
1185 UDP_TUNNEL_TYPE_GENEVE
);
1189 /* Initialize the device structure. */
1190 static void geneve_setup(struct net_device
*dev
)
1194 dev
->netdev_ops
= &geneve_netdev_ops
;
1195 dev
->ethtool_ops
= &geneve_ethtool_ops
;
1196 dev
->destructor
= free_netdev
;
1198 SET_NETDEV_DEVTYPE(dev
, &geneve_type
);
1200 dev
->features
|= NETIF_F_LLTX
;
1201 dev
->features
|= NETIF_F_SG
| NETIF_F_HW_CSUM
;
1202 dev
->features
|= NETIF_F_RXCSUM
;
1203 dev
->features
|= NETIF_F_GSO_SOFTWARE
;
1205 dev
->hw_features
|= NETIF_F_SG
| NETIF_F_HW_CSUM
| NETIF_F_RXCSUM
;
1206 dev
->hw_features
|= NETIF_F_GSO_SOFTWARE
;
1208 netif_keep_dst(dev
);
1209 dev
->priv_flags
&= ~IFF_TX_SKB_SHARING
;
1210 dev
->priv_flags
|= IFF_LIVE_ADDR_CHANGE
| IFF_NO_QUEUE
;
1211 eth_hw_addr_random(dev
);
1214 static const struct nla_policy geneve_policy
[IFLA_GENEVE_MAX
+ 1] = {
1215 [IFLA_GENEVE_ID
] = { .type
= NLA_U32
},
1216 [IFLA_GENEVE_REMOTE
] = { .len
= FIELD_SIZEOF(struct iphdr
, daddr
) },
1217 [IFLA_GENEVE_REMOTE6
] = { .len
= sizeof(struct in6_addr
) },
1218 [IFLA_GENEVE_TTL
] = { .type
= NLA_U8
},
1219 [IFLA_GENEVE_TOS
] = { .type
= NLA_U8
},
1220 [IFLA_GENEVE_LABEL
] = { .type
= NLA_U32
},
1221 [IFLA_GENEVE_PORT
] = { .type
= NLA_U16
},
1222 [IFLA_GENEVE_COLLECT_METADATA
] = { .type
= NLA_FLAG
},
1223 [IFLA_GENEVE_UDP_CSUM
] = { .type
= NLA_U8
},
1224 [IFLA_GENEVE_UDP_ZERO_CSUM6_TX
] = { .type
= NLA_U8
},
1225 [IFLA_GENEVE_UDP_ZERO_CSUM6_RX
] = { .type
= NLA_U8
},
1228 static int geneve_validate(struct nlattr
*tb
[], struct nlattr
*data
[])
1230 if (tb
[IFLA_ADDRESS
]) {
1231 if (nla_len(tb
[IFLA_ADDRESS
]) != ETH_ALEN
)
1234 if (!is_valid_ether_addr(nla_data(tb
[IFLA_ADDRESS
])))
1235 return -EADDRNOTAVAIL
;
1241 if (data
[IFLA_GENEVE_ID
]) {
1242 __u32 vni
= nla_get_u32(data
[IFLA_GENEVE_ID
]);
1244 if (vni
>= GENEVE_VID_MASK
)
1251 static struct geneve_dev
*geneve_find_dev(struct geneve_net
*gn
,
1253 union geneve_addr
*remote
,
1255 bool *tun_on_same_port
,
1256 bool *tun_collect_md
)
1258 struct geneve_dev
*geneve
, *t
;
1260 *tun_on_same_port
= false;
1261 *tun_collect_md
= false;
1263 list_for_each_entry(geneve
, &gn
->geneve_list
, next
) {
1264 if (geneve
->dst_port
== dst_port
) {
1265 *tun_collect_md
= geneve
->collect_md
;
1266 *tun_on_same_port
= true;
1268 if (!memcmp(vni
, geneve
->vni
, sizeof(geneve
->vni
)) &&
1269 !memcmp(remote
, &geneve
->remote
, sizeof(geneve
->remote
)) &&
1270 dst_port
== geneve
->dst_port
)
1276 static int geneve_configure(struct net
*net
, struct net_device
*dev
,
1277 union geneve_addr
*remote
,
1278 __u32 vni
, __u8 ttl
, __u8 tos
, __be32 label
,
1279 __be16 dst_port
, bool metadata
, u32 flags
)
1281 struct geneve_net
*gn
= net_generic(net
, geneve_net_id
);
1282 struct geneve_dev
*t
, *geneve
= netdev_priv(dev
);
1283 bool tun_collect_md
, tun_on_same_port
;
1289 (remote
->sa
.sa_family
!= AF_UNSPEC
|| vni
|| tos
|| ttl
|| label
))
1295 geneve
->vni
[0] = (vni
& 0x00ff0000) >> 16;
1296 geneve
->vni
[1] = (vni
& 0x0000ff00) >> 8;
1297 geneve
->vni
[2] = vni
& 0x000000ff;
1299 if ((remote
->sa
.sa_family
== AF_INET
&&
1300 IN_MULTICAST(ntohl(remote
->sin
.sin_addr
.s_addr
))) ||
1301 (remote
->sa
.sa_family
== AF_INET6
&&
1302 ipv6_addr_is_multicast(&remote
->sin6
.sin6_addr
)))
1304 if (label
&& remote
->sa
.sa_family
!= AF_INET6
)
1307 geneve
->remote
= *remote
;
1311 geneve
->label
= label
;
1312 geneve
->dst_port
= dst_port
;
1313 geneve
->collect_md
= metadata
;
1314 geneve
->flags
= flags
;
1316 t
= geneve_find_dev(gn
, dst_port
, remote
, geneve
->vni
,
1317 &tun_on_same_port
, &tun_collect_md
);
1321 /* make enough headroom for basic scenario */
1322 encap_len
= GENEVE_BASE_HLEN
+ ETH_HLEN
;
1323 if (remote
->sa
.sa_family
== AF_INET
)
1324 encap_len
+= sizeof(struct iphdr
);
1326 encap_len
+= sizeof(struct ipv6hdr
);
1327 dev
->needed_headroom
= encap_len
+ ETH_HLEN
;
1330 if (tun_on_same_port
)
1337 dst_cache_reset(&geneve
->dst_cache
);
1339 err
= register_netdevice(dev
);
1343 list_add(&geneve
->next
, &gn
->geneve_list
);
1347 static int geneve_newlink(struct net
*net
, struct net_device
*dev
,
1348 struct nlattr
*tb
[], struct nlattr
*data
[])
1350 __be16 dst_port
= htons(GENEVE_UDP_PORT
);
1351 __u8 ttl
= 0, tos
= 0;
1352 bool metadata
= false;
1353 union geneve_addr remote
= geneve_remote_unspec
;
1358 if (data
[IFLA_GENEVE_REMOTE
] && data
[IFLA_GENEVE_REMOTE6
])
1361 if (data
[IFLA_GENEVE_REMOTE
]) {
1362 remote
.sa
.sa_family
= AF_INET
;
1363 remote
.sin
.sin_addr
.s_addr
=
1364 nla_get_in_addr(data
[IFLA_GENEVE_REMOTE
]);
1367 if (data
[IFLA_GENEVE_REMOTE6
]) {
1368 if (!IS_ENABLED(CONFIG_IPV6
))
1369 return -EPFNOSUPPORT
;
1371 remote
.sa
.sa_family
= AF_INET6
;
1372 remote
.sin6
.sin6_addr
=
1373 nla_get_in6_addr(data
[IFLA_GENEVE_REMOTE6
]);
1375 if (ipv6_addr_type(&remote
.sin6
.sin6_addr
) &
1376 IPV6_ADDR_LINKLOCAL
) {
1377 netdev_dbg(dev
, "link-local remote is unsupported\n");
1382 if (data
[IFLA_GENEVE_ID
])
1383 vni
= nla_get_u32(data
[IFLA_GENEVE_ID
]);
1385 if (data
[IFLA_GENEVE_TTL
])
1386 ttl
= nla_get_u8(data
[IFLA_GENEVE_TTL
]);
1388 if (data
[IFLA_GENEVE_TOS
])
1389 tos
= nla_get_u8(data
[IFLA_GENEVE_TOS
]);
1391 if (data
[IFLA_GENEVE_LABEL
])
1392 label
= nla_get_be32(data
[IFLA_GENEVE_LABEL
]) &
1393 IPV6_FLOWLABEL_MASK
;
1395 if (data
[IFLA_GENEVE_PORT
])
1396 dst_port
= nla_get_be16(data
[IFLA_GENEVE_PORT
]);
1398 if (data
[IFLA_GENEVE_COLLECT_METADATA
])
1401 if (data
[IFLA_GENEVE_UDP_CSUM
] &&
1402 !nla_get_u8(data
[IFLA_GENEVE_UDP_CSUM
]))
1403 flags
|= GENEVE_F_UDP_ZERO_CSUM_TX
;
1405 if (data
[IFLA_GENEVE_UDP_ZERO_CSUM6_TX
] &&
1406 nla_get_u8(data
[IFLA_GENEVE_UDP_ZERO_CSUM6_TX
]))
1407 flags
|= GENEVE_F_UDP_ZERO_CSUM6_TX
;
1409 if (data
[IFLA_GENEVE_UDP_ZERO_CSUM6_RX
] &&
1410 nla_get_u8(data
[IFLA_GENEVE_UDP_ZERO_CSUM6_RX
]))
1411 flags
|= GENEVE_F_UDP_ZERO_CSUM6_RX
;
1413 return geneve_configure(net
, dev
, &remote
, vni
, ttl
, tos
, label
,
1414 dst_port
, metadata
, flags
);
1417 static void geneve_dellink(struct net_device
*dev
, struct list_head
*head
)
1419 struct geneve_dev
*geneve
= netdev_priv(dev
);
1421 list_del(&geneve
->next
);
1422 unregister_netdevice_queue(dev
, head
);
1425 static size_t geneve_get_size(const struct net_device
*dev
)
1427 return nla_total_size(sizeof(__u32
)) + /* IFLA_GENEVE_ID */
1428 nla_total_size(sizeof(struct in6_addr
)) + /* IFLA_GENEVE_REMOTE{6} */
1429 nla_total_size(sizeof(__u8
)) + /* IFLA_GENEVE_TTL */
1430 nla_total_size(sizeof(__u8
)) + /* IFLA_GENEVE_TOS */
1431 nla_total_size(sizeof(__be32
)) + /* IFLA_GENEVE_LABEL */
1432 nla_total_size(sizeof(__be16
)) + /* IFLA_GENEVE_PORT */
1433 nla_total_size(0) + /* IFLA_GENEVE_COLLECT_METADATA */
1434 nla_total_size(sizeof(__u8
)) + /* IFLA_GENEVE_UDP_CSUM */
1435 nla_total_size(sizeof(__u8
)) + /* IFLA_GENEVE_UDP_ZERO_CSUM6_TX */
1436 nla_total_size(sizeof(__u8
)) + /* IFLA_GENEVE_UDP_ZERO_CSUM6_RX */
1440 static int geneve_fill_info(struct sk_buff
*skb
, const struct net_device
*dev
)
1442 struct geneve_dev
*geneve
= netdev_priv(dev
);
1445 vni
= (geneve
->vni
[0] << 16) | (geneve
->vni
[1] << 8) | geneve
->vni
[2];
1446 if (nla_put_u32(skb
, IFLA_GENEVE_ID
, vni
))
1447 goto nla_put_failure
;
1449 if (geneve
->remote
.sa
.sa_family
== AF_INET
) {
1450 if (nla_put_in_addr(skb
, IFLA_GENEVE_REMOTE
,
1451 geneve
->remote
.sin
.sin_addr
.s_addr
))
1452 goto nla_put_failure
;
1453 #if IS_ENABLED(CONFIG_IPV6)
1455 if (nla_put_in6_addr(skb
, IFLA_GENEVE_REMOTE6
,
1456 &geneve
->remote
.sin6
.sin6_addr
))
1457 goto nla_put_failure
;
1461 if (nla_put_u8(skb
, IFLA_GENEVE_TTL
, geneve
->ttl
) ||
1462 nla_put_u8(skb
, IFLA_GENEVE_TOS
, geneve
->tos
) ||
1463 nla_put_be32(skb
, IFLA_GENEVE_LABEL
, geneve
->label
))
1464 goto nla_put_failure
;
1466 if (nla_put_be16(skb
, IFLA_GENEVE_PORT
, geneve
->dst_port
))
1467 goto nla_put_failure
;
1469 if (geneve
->collect_md
) {
1470 if (nla_put_flag(skb
, IFLA_GENEVE_COLLECT_METADATA
))
1471 goto nla_put_failure
;
1474 if (nla_put_u8(skb
, IFLA_GENEVE_UDP_CSUM
,
1475 !(geneve
->flags
& GENEVE_F_UDP_ZERO_CSUM_TX
)) ||
1476 nla_put_u8(skb
, IFLA_GENEVE_UDP_ZERO_CSUM6_TX
,
1477 !!(geneve
->flags
& GENEVE_F_UDP_ZERO_CSUM6_TX
)) ||
1478 nla_put_u8(skb
, IFLA_GENEVE_UDP_ZERO_CSUM6_RX
,
1479 !!(geneve
->flags
& GENEVE_F_UDP_ZERO_CSUM6_RX
)))
1480 goto nla_put_failure
;
1488 static struct rtnl_link_ops geneve_link_ops __read_mostly
= {
1490 .maxtype
= IFLA_GENEVE_MAX
,
1491 .policy
= geneve_policy
,
1492 .priv_size
= sizeof(struct geneve_dev
),
1493 .setup
= geneve_setup
,
1494 .validate
= geneve_validate
,
1495 .newlink
= geneve_newlink
,
1496 .dellink
= geneve_dellink
,
1497 .get_size
= geneve_get_size
,
1498 .fill_info
= geneve_fill_info
,
1501 struct net_device
*geneve_dev_create_fb(struct net
*net
, const char *name
,
1502 u8 name_assign_type
, u16 dst_port
)
1504 struct nlattr
*tb
[IFLA_MAX
+ 1];
1505 struct net_device
*dev
;
1506 LIST_HEAD(list_kill
);
1509 memset(tb
, 0, sizeof(tb
));
1510 dev
= rtnl_create_link(net
, name
, name_assign_type
,
1511 &geneve_link_ops
, tb
);
1515 err
= geneve_configure(net
, dev
, &geneve_remote_unspec
,
1516 0, 0, 0, 0, htons(dst_port
), true,
1517 GENEVE_F_UDP_ZERO_CSUM6_RX
);
1520 return ERR_PTR(err
);
1523 /* openvswitch users expect packet sizes to be unrestricted,
1524 * so set the largest MTU we can.
1526 err
= __geneve_change_mtu(dev
, IP_MAX_MTU
, false);
1530 err
= rtnl_configure_link(dev
, NULL
);
1537 geneve_dellink(dev
, &list_kill
);
1538 unregister_netdevice_many(&list_kill
);
1539 return ERR_PTR(err
);
1541 EXPORT_SYMBOL_GPL(geneve_dev_create_fb
);
1543 static int geneve_netdevice_event(struct notifier_block
*unused
,
1544 unsigned long event
, void *ptr
)
1546 struct net_device
*dev
= netdev_notifier_info_to_dev(ptr
);
1548 if (event
== NETDEV_UDP_TUNNEL_PUSH_INFO
)
1549 geneve_push_rx_ports(dev
);
1554 static struct notifier_block geneve_notifier_block __read_mostly
= {
1555 .notifier_call
= geneve_netdevice_event
,
/* Per-namespace init hook (geneve_net_ops.init).
 *
 * Looks up this namespace's struct geneve_net through
 * net_generic(net, geneve_net_id) and initialises both of its list
 * heads, geneve_list and sock_list, as empty lists.
 */
1558 static __net_init
int geneve_init_net(struct net
*net
)
1560 struct geneve_net
*gn
= net_generic(net
, geneve_net_id
);
1562 INIT_LIST_HEAD(&gn
->geneve_list
);
1563 INIT_LIST_HEAD(&gn
->sock_list
);
/* Per-namespace exit hook (geneve_net_ops.exit).
 *
 * Queues every geneve device tied to @net on a single list and then
 * unregisters the whole batch with unregister_netdevice_many(). The
 * devices are collected in two passes:
 *
 *   1. all net_devices currently in @net whose rtnl_link_ops is
 *      geneve_link_ops;
 *   2. all entries on this namespace's geneve_list whose device now
 *      lives in a different namespace (dev_net() != @net). Entries
 *      still in @net were queued by pass 1 and are skipped here so that
 *      no device is queued twice.
 *
 * Both walks use the _safe iterator variants (for_each_netdev_safe,
 * list_for_each_entry_safe).
 */
1567 static void __net_exit
geneve_exit_net(struct net
*net
)
1569 struct geneve_net
*gn
= net_generic(net
, geneve_net_id
);
1570 struct geneve_dev
*geneve
, *next
;
1571 struct net_device
*dev
, *aux
;
1576 /* gather any geneve devices that were moved into this ns */
1577 for_each_netdev_safe(net
, dev
, aux
)
1578 if (dev
->rtnl_link_ops
== &geneve_link_ops
)
1579 unregister_netdevice_queue(dev
, &list
);
1581 /* now gather any other geneve devices that were created in this ns */
1582 list_for_each_entry_safe(geneve
, next
, &gn
->geneve_list
, next
) {
1583 /* If geneve->dev is in the same netns, it was already added
1584 * to the list by the previous loop.
1586 if (!net_eq(dev_net(geneve
->dev
), net
))
1587 unregister_netdevice_queue(geneve
->dev
, &list
);
1590 /* unregister the devices gathered above */
1591 unregister_netdevice_many(&list
);
/* Per-network-namespace operations for this module.
 *
 * geneve_init_net() and geneve_exit_net() are the init/exit hooks.
 * .id points at geneve_net_id and .size is sizeof(struct geneve_net);
 * together they describe the per-namespace struct geneve_net that the
 * hooks fetch with net_generic(net, geneve_net_id).
 */
1595 static struct pernet_operations geneve_net_ops
= {
1596 .init
= geneve_init_net
,
1597 .exit
= geneve_exit_net
,
1598 .id
= &geneve_net_id
,
1599 .size
= sizeof(struct geneve_net
),
/* Module initialisation, hooked up through late_initcall().
 *
 * Registers, in this order:
 *   1. the per-namespace operations (geneve_net_ops),
 *   2. the netdevice notifier (geneve_notifier_block),
 *   3. the rtnetlink link operations (geneve_link_ops).
 *
 * The two unregister calls that follow the registrations form the
 * unwind path and undo steps 2 and 1 in reverse order.
 */
1602 static int __init
geneve_init_module(void)
1606 rc
= register_pernet_subsys(&geneve_net_ops
);
1610 rc
= register_netdevice_notifier(&geneve_notifier_block
);
1614 rc
= rtnl_link_register(&geneve_link_ops
);
1621 unregister_netdevice_notifier(&geneve_notifier_block
);
1623 unregister_pernet_subsys(&geneve_net_ops
);
1627 late_initcall(geneve_init_module
);
/* Module exit, hooked up through module_exit().
 *
 * Undoes geneve_init_module() in reverse registration order: the
 * rtnetlink link operations first, then the netdevice notifier, then
 * the per-namespace operations.
 */
1629 static void __exit
geneve_cleanup_module(void)
1631 rtnl_link_unregister(&geneve_link_ops
);
1632 unregister_netdevice_notifier(&geneve_notifier_block
);
1633 unregister_pernet_subsys(&geneve_net_ops
);
1635 module_exit(geneve_cleanup_module
);
/* Module metadata: licence, version, author, description and rtnl link
 * alias. The version string is GENEVE_NETDEV_VER, defined as "0.6" near
 * the top of this file; the alias is declared for the name "geneve".
 */
1637 MODULE_LICENSE("GPL");
1638 MODULE_VERSION(GENEVE_NETDEV_VER
);
1639 MODULE_AUTHOR("John W. Linville <linville@tuxdriver.com>");
1640 MODULE_DESCRIPTION("Interface driver for GENEVE encapsulated traffic");
1641 MODULE_ALIAS_RTNL_LINK("geneve");