2 * IPv6 over IPv4 tunnel device - Simple Internet Transition (SIT)
3 * Linux INET6 implementation
6 * Pedro Roque <roque@di.fc.ul.pt>
7 * Alexey Kuznetsov <kuznet@ms2.inr.ac.ru>
9 * This program is free software; you can redistribute it and/or
10 * modify it under the terms of the GNU General Public License
11 * as published by the Free Software Foundation; either version
12 * 2 of the License, or (at your option) any later version.
15 * Roger Venning <r.venning@telstra.com>: 6to4 support
16 * Nate Thompson <nate@thebog.net>: 6to4 support
17 * Fred Templin <fred.l.templin@boeing.com>: isatap support
18 * Sascha Hlusiak <mail@saschahlusiak.de>: stateless autoconf for isatap
21 #include <linux/module.h>
22 #include <linux/capability.h>
23 #include <linux/errno.h>
24 #include <linux/types.h>
25 #include <linux/socket.h>
26 #include <linux/sockios.h>
27 #include <linux/net.h>
28 #include <linux/in6.h>
29 #include <linux/netdevice.h>
30 #include <linux/if_arp.h>
31 #include <linux/icmp.h>
32 #include <asm/uaccess.h>
33 #include <linux/init.h>
34 #include <linux/netfilter_ipv4.h>
35 #include <linux/if_ether.h>
41 #include <net/protocol.h>
42 #include <net/transp_v6.h>
43 #include <net/ip6_fib.h>
44 #include <net/ip6_route.h>
45 #include <net/ndisc.h>
46 #include <net/addrconf.h>
51 #include <net/inet_ecn.h>
53 #include <net/dsfield.h>
54 #include <net/net_namespace.h>
55 #include <net/netns/generic.h>
58 This version of net/ipv6/sit.c is cloned of net/ipv4/ip_gre.c
60 For comments look at net/ipv4/ip_gre.c --ANK
64 #define HASH(addr) (((__force u32)addr^((__force u32)addr>>4))&0xF)
66 static void ipip6_fb_tunnel_init(struct net_device
*dev
);
67 static void ipip6_tunnel_init(struct net_device
*dev
);
68 static void ipip6_tunnel_setup(struct net_device
*dev
);
70 static int sit_net_id
;
72 struct ip_tunnel
*tunnels_r_l
[HASH_SIZE
];
73 struct ip_tunnel
*tunnels_r
[HASH_SIZE
];
74 struct ip_tunnel
*tunnels_l
[HASH_SIZE
];
75 struct ip_tunnel
*tunnels_wc
[1];
76 struct ip_tunnel
**tunnels
[4];
78 struct net_device
*fb_tunnel_dev
;
81 static DEFINE_RWLOCK(ipip6_lock
);
83 static struct ip_tunnel
* ipip6_tunnel_lookup(struct net
*net
,
84 struct net_device
*dev
, __be32 remote
, __be32 local
)
86 unsigned h0
= HASH(remote
);
87 unsigned h1
= HASH(local
);
89 struct sit_net
*sitn
= net_generic(net
, sit_net_id
);
91 for (t
= sitn
->tunnels_r_l
[h0
^h1
]; t
; t
= t
->next
) {
92 if (local
== t
->parms
.iph
.saddr
&&
93 remote
== t
->parms
.iph
.daddr
&&
94 (!dev
|| !t
->parms
.link
|| dev
->iflink
== t
->parms
.link
) &&
95 (t
->dev
->flags
& IFF_UP
))
98 for (t
= sitn
->tunnels_r
[h0
]; t
; t
= t
->next
) {
99 if (remote
== t
->parms
.iph
.daddr
&&
100 (!dev
|| !t
->parms
.link
|| dev
->iflink
== t
->parms
.link
) &&
101 (t
->dev
->flags
& IFF_UP
))
104 for (t
= sitn
->tunnels_l
[h1
]; t
; t
= t
->next
) {
105 if (local
== t
->parms
.iph
.saddr
&&
106 (!dev
|| !t
->parms
.link
|| dev
->iflink
== t
->parms
.link
) &&
107 (t
->dev
->flags
& IFF_UP
))
110 t
= sitn
->tunnels_wc
[0];
111 if ((t
!= NULL
) && (t
->dev
->flags
& IFF_UP
))
116 static struct ip_tunnel
**__ipip6_bucket(struct sit_net
*sitn
,
117 struct ip_tunnel_parm
*parms
)
119 __be32 remote
= parms
->iph
.daddr
;
120 __be32 local
= parms
->iph
.saddr
;
132 return &sitn
->tunnels
[prio
][h
];
135 static inline struct ip_tunnel
**ipip6_bucket(struct sit_net
*sitn
,
138 return __ipip6_bucket(sitn
, &t
->parms
);
141 static void ipip6_tunnel_unlink(struct sit_net
*sitn
, struct ip_tunnel
*t
)
143 struct ip_tunnel
**tp
;
145 for (tp
= ipip6_bucket(sitn
, t
); *tp
; tp
= &(*tp
)->next
) {
147 write_lock_bh(&ipip6_lock
);
149 write_unlock_bh(&ipip6_lock
);
155 static void ipip6_tunnel_link(struct sit_net
*sitn
, struct ip_tunnel
*t
)
157 struct ip_tunnel
**tp
= ipip6_bucket(sitn
, t
);
160 write_lock_bh(&ipip6_lock
);
162 write_unlock_bh(&ipip6_lock
);
165 static struct ip_tunnel
* ipip6_tunnel_locate(struct net
*net
,
166 struct ip_tunnel_parm
*parms
, int create
)
168 __be32 remote
= parms
->iph
.daddr
;
169 __be32 local
= parms
->iph
.saddr
;
170 struct ip_tunnel
*t
, **tp
, *nt
;
171 struct net_device
*dev
;
173 struct sit_net
*sitn
= net_generic(net
, sit_net_id
);
175 for (tp
= __ipip6_bucket(sitn
, parms
); (t
= *tp
) != NULL
; tp
= &t
->next
) {
176 if (local
== t
->parms
.iph
.saddr
&&
177 remote
== t
->parms
.iph
.daddr
&&
178 parms
->link
== t
->parms
.link
) {
189 strlcpy(name
, parms
->name
, IFNAMSIZ
);
191 sprintf(name
, "sit%%d");
193 dev
= alloc_netdev(sizeof(*t
), name
, ipip6_tunnel_setup
);
197 dev_net_set(dev
, net
);
199 if (strchr(name
, '%')) {
200 if (dev_alloc_name(dev
, name
) < 0)
204 nt
= netdev_priv(dev
);
207 ipip6_tunnel_init(dev
);
209 if (parms
->i_flags
& SIT_ISATAP
)
210 dev
->priv_flags
|= IFF_ISATAP
;
212 if (register_netdevice(dev
) < 0)
217 ipip6_tunnel_link(sitn
, nt
);
226 static void ipip6_tunnel_rs_timer(unsigned long data
)
228 struct ip_tunnel_prl_entry
*p
= (struct ip_tunnel_prl_entry
*) data
;
229 struct inet6_dev
*ifp
;
230 struct inet6_ifaddr
*addr
;
233 ifp
= __in6_dev_get(p
->tunnel
->dev
);
235 read_lock_bh(&ifp
->lock
);
236 for (addr
= ifp
->addr_list
; addr
; addr
= addr
->if_next
) {
239 if (!(ipv6_addr_type(&addr
->addr
) & IPV6_ADDR_LINKLOCAL
))
242 /* Send RS to guessed linklocal address of router
244 * Better: send to ff02::2 encapsuled in unicast directly
245 * to router-v4 instead of guessing the v6 address.
247 * Cisco/Windows seem to not set the u/l bit correctly,
248 * so we won't guess right.
250 ipv6_addr_set(&rtr
, htonl(0xFE800000), 0, 0, 0);
251 if (!__ipv6_isatap_ifid(rtr
.s6_addr
+ 8,
253 ndisc_send_rs(p
->tunnel
->dev
, &addr
->addr
, &rtr
);
256 read_unlock_bh(&ifp
->lock
);
258 mod_timer(&p
->rs_timer
, jiffies
+ HZ
* p
->rs_delay
);
259 spin_unlock(&p
->lock
);
264 static struct ip_tunnel_prl_entry
*
265 __ipip6_tunnel_locate_prl(struct ip_tunnel
*t
, __be32 addr
)
267 struct ip_tunnel_prl_entry
*p
= (struct ip_tunnel_prl_entry
*)NULL
;
269 for (p
= t
->prl
; p
; p
= p
->next
)
276 static int ipip6_tunnel_get_prl(struct ip_tunnel
*t
,
277 struct ip_tunnel_prl __user
*a
)
279 struct ip_tunnel_prl kprl
, *kp
;
280 struct ip_tunnel_prl_entry
*prl
;
281 unsigned int cmax
, c
= 0, ca
, len
;
284 if (copy_from_user(&kprl
, a
, sizeof(kprl
)))
286 cmax
= kprl
.datalen
/ sizeof(kprl
);
287 if (cmax
> 1 && kprl
.addr
!= htonl(INADDR_ANY
))
290 /* For simple GET or for root users,
291 * we try harder to allocate.
293 kp
= (cmax
<= 1 || capable(CAP_NET_ADMIN
)) ?
294 kcalloc(cmax
, sizeof(*kp
), GFP_KERNEL
) :
297 read_lock(&ipip6_lock
);
299 ca
= t
->prl_count
< cmax
? t
->prl_count
: cmax
;
302 /* We don't try hard to allocate much memory for
304 * For root users, retry allocating enough memory for
307 kp
= kcalloc(ca
, sizeof(*kp
), GFP_ATOMIC
);
315 for (prl
= t
->prl
; prl
; prl
= prl
->next
) {
318 if (kprl
.addr
!= htonl(INADDR_ANY
) && prl
->addr
!= kprl
.addr
)
320 kp
[c
].addr
= prl
->addr
;
321 kp
[c
].flags
= prl
->flags
;
322 kp
[c
].rs_delay
= prl
->rs_delay
;
324 if (kprl
.addr
!= htonl(INADDR_ANY
))
328 read_unlock(&ipip6_lock
);
330 len
= sizeof(*kp
) * c
;
332 if ((len
&& copy_to_user(a
+ 1, kp
, len
)) || put_user(len
, &a
->datalen
))
341 ipip6_tunnel_add_prl(struct ip_tunnel
*t
, struct ip_tunnel_prl
*a
, int chg
)
343 struct ip_tunnel_prl_entry
*p
;
346 if (a
->addr
== htonl(INADDR_ANY
))
349 write_lock(&ipip6_lock
);
351 for (p
= t
->prl
; p
; p
= p
->next
) {
352 if (p
->addr
== a
->addr
) {
365 p
= kzalloc(sizeof(struct ip_tunnel_prl_entry
), GFP_KERNEL
);
376 spin_lock_init(&p
->lock
);
377 setup_timer(&p
->rs_timer
, ipip6_tunnel_rs_timer
, (unsigned long) p
);
381 p
->rs_delay
= a
->rs_delay
;
382 if (p
->rs_delay
== 0)
383 p
->rs_delay
= IPTUNNEL_RS_DEFAULT_DELAY
;
385 del_timer(&p
->rs_timer
);
386 if (p
->flags
& PRL_DEFAULT
)
387 mod_timer(&p
->rs_timer
, jiffies
+ 1);
388 spin_unlock(&p
->lock
);
390 write_unlock(&ipip6_lock
);
395 ipip6_tunnel_del_prl(struct ip_tunnel
*t
, struct ip_tunnel_prl
*a
)
397 struct ip_tunnel_prl_entry
*x
, **p
;
400 write_lock(&ipip6_lock
);
402 if (a
&& a
->addr
!= htonl(INADDR_ANY
)) {
403 for (p
= &t
->prl
; *p
; p
= &(*p
)->next
) {
404 if ((*p
)->addr
== a
->addr
) {
408 del_timer(&x
->rs_timer
);
409 spin_unlock(&x
->lock
);
419 t
->prl
= t
->prl
->next
;
421 del_timer(&x
->rs_timer
);
422 spin_unlock(&x
->lock
);
428 write_unlock(&ipip6_lock
);
433 isatap_chksrc(struct sk_buff
*skb
, struct iphdr
*iph
, struct ip_tunnel
*t
)
435 struct ip_tunnel_prl_entry
*p
;
438 read_lock(&ipip6_lock
);
439 p
= __ipip6_tunnel_locate_prl(t
, iph
->saddr
);
441 if (p
->flags
& PRL_DEFAULT
)
442 skb
->ndisc_nodetype
= NDISC_NODETYPE_DEFAULT
;
444 skb
->ndisc_nodetype
= NDISC_NODETYPE_NODEFAULT
;
446 struct in6_addr
*addr6
= &ipv6_hdr(skb
)->saddr
;
447 if (ipv6_addr_is_isatap(addr6
) &&
448 (addr6
->s6_addr32
[3] == iph
->saddr
) &&
449 ipv6_chk_prefix(addr6
, t
->dev
))
450 skb
->ndisc_nodetype
= NDISC_NODETYPE_HOST
;
454 read_unlock(&ipip6_lock
);
458 static void ipip6_tunnel_uninit(struct net_device
*dev
)
460 struct net
*net
= dev_net(dev
);
461 struct sit_net
*sitn
= net_generic(net
, sit_net_id
);
463 if (dev
== sitn
->fb_tunnel_dev
) {
464 write_lock_bh(&ipip6_lock
);
465 sitn
->tunnels_wc
[0] = NULL
;
466 write_unlock_bh(&ipip6_lock
);
469 ipip6_tunnel_unlink(sitn
, netdev_priv(dev
));
470 ipip6_tunnel_del_prl(netdev_priv(dev
), NULL
);
476 static int ipip6_err(struct sk_buff
*skb
, u32 info
)
479 /* All the routers (except for Linux) return only
480 8 bytes of packet payload. It means, that precise relaying of
481 ICMP in the real Internet is absolutely infeasible.
483 struct iphdr
*iph
= (struct iphdr
*)skb
->data
;
484 const int type
= icmp_hdr(skb
)->type
;
485 const int code
= icmp_hdr(skb
)->code
;
491 case ICMP_PARAMETERPROB
:
494 case ICMP_DEST_UNREACH
:
497 case ICMP_PORT_UNREACH
:
498 /* Impossible event. */
500 case ICMP_FRAG_NEEDED
:
501 /* Soft state for pmtu is maintained by IP core. */
504 /* All others are translated to HOST_UNREACH.
505 rfc2003 contains "deep thoughts" about NET_UNREACH,
506 I believe they are just ether pollution. --ANK
511 case ICMP_TIME_EXCEEDED
:
512 if (code
!= ICMP_EXC_TTL
)
519 read_lock(&ipip6_lock
);
520 t
= ipip6_tunnel_lookup(dev_net(skb
->dev
),
524 if (t
== NULL
|| t
->parms
.iph
.daddr
== 0)
528 if (t
->parms
.iph
.ttl
== 0 && type
== ICMP_TIME_EXCEEDED
)
531 if (time_before(jiffies
, t
->err_time
+ IPTUNNEL_ERR_TIMEO
))
535 t
->err_time
= jiffies
;
537 read_unlock(&ipip6_lock
);
541 static inline void ipip6_ecn_decapsulate(struct iphdr
*iph
, struct sk_buff
*skb
)
543 if (INET_ECN_is_ce(iph
->tos
))
544 IP6_ECN_set_ce(ipv6_hdr(skb
));
547 static int ipip6_rcv(struct sk_buff
*skb
)
550 struct ip_tunnel
*tunnel
;
552 if (!pskb_may_pull(skb
, sizeof(struct ipv6hdr
)))
557 read_lock(&ipip6_lock
);
558 tunnel
= ipip6_tunnel_lookup(dev_net(skb
->dev
), skb
->dev
,
559 iph
->saddr
, iph
->daddr
);
560 if (tunnel
!= NULL
) {
562 skb
->mac_header
= skb
->network_header
;
563 skb_reset_network_header(skb
);
564 IPCB(skb
)->flags
= 0;
565 skb
->protocol
= htons(ETH_P_IPV6
);
566 skb
->pkt_type
= PACKET_HOST
;
568 if ((tunnel
->dev
->priv_flags
& IFF_ISATAP
) &&
569 !isatap_chksrc(skb
, iph
, tunnel
)) {
570 tunnel
->dev
->stats
.rx_errors
++;
571 read_unlock(&ipip6_lock
);
575 tunnel
->dev
->stats
.rx_packets
++;
576 tunnel
->dev
->stats
.rx_bytes
+= skb
->len
;
577 skb
->dev
= tunnel
->dev
;
580 ipip6_ecn_decapsulate(iph
, skb
);
582 read_unlock(&ipip6_lock
);
586 icmp_send(skb
, ICMP_DEST_UNREACH
, ICMP_PORT_UNREACH
, 0);
587 read_unlock(&ipip6_lock
);
593 /* Returns the embedded IPv4 address if the IPv6 address
594 comes from 6to4 (RFC 3056) addr space */
596 static inline __be32
try_6to4(struct in6_addr
*v6dst
)
600 if (v6dst
->s6_addr16
[0] == htons(0x2002)) {
601 /* 6to4 v6 addr has 16 bits prefix, 32 v4addr, 16 SLA, ... */
602 memcpy(&dst
, &v6dst
->s6_addr16
[1], 4);
608 * This function assumes it is being called from dev_queue_xmit()
609 * and that skb is filled properly by that function.
612 static netdev_tx_t
ipip6_tunnel_xmit(struct sk_buff
*skb
,
613 struct net_device
*dev
)
615 struct ip_tunnel
*tunnel
= netdev_priv(dev
);
616 struct net_device_stats
*stats
= &tunnel
->dev
->stats
;
617 struct iphdr
*tiph
= &tunnel
->parms
.iph
;
618 struct ipv6hdr
*iph6
= ipv6_hdr(skb
);
619 u8 tos
= tunnel
->parms
.iph
.tos
;
620 struct rtable
*rt
; /* Route to the other host */
621 struct net_device
*tdev
; /* Device to other host */
622 struct iphdr
*iph
; /* Our new IP header */
623 unsigned int max_headroom
; /* The extra header space needed */
624 __be32 dst
= tiph
->daddr
;
626 struct in6_addr
*addr6
;
629 if (tunnel
->recursion
++) {
634 if (skb
->protocol
!= htons(ETH_P_IPV6
))
637 /* ISATAP (RFC4214) - must come before 6to4 */
638 if (dev
->priv_flags
& IFF_ISATAP
) {
639 struct neighbour
*neigh
= NULL
;
642 neigh
= skb_dst(skb
)->neighbour
;
646 printk(KERN_DEBUG
"sit: nexthop == NULL\n");
650 addr6
= (struct in6_addr
*)&neigh
->primary_key
;
651 addr_type
= ipv6_addr_type(addr6
);
653 if ((addr_type
& IPV6_ADDR_UNICAST
) &&
654 ipv6_addr_is_isatap(addr6
))
655 dst
= addr6
->s6_addr32
[3];
661 dst
= try_6to4(&iph6
->daddr
);
664 struct neighbour
*neigh
= NULL
;
667 neigh
= skb_dst(skb
)->neighbour
;
671 printk(KERN_DEBUG
"sit: nexthop == NULL\n");
675 addr6
= (struct in6_addr
*)&neigh
->primary_key
;
676 addr_type
= ipv6_addr_type(addr6
);
678 if (addr_type
== IPV6_ADDR_ANY
) {
679 addr6
= &ipv6_hdr(skb
)->daddr
;
680 addr_type
= ipv6_addr_type(addr6
);
683 if ((addr_type
& IPV6_ADDR_COMPATv4
) == 0)
686 dst
= addr6
->s6_addr32
[3];
690 struct flowi fl
= { .nl_u
= { .ip4_u
=
692 .saddr
= tiph
->saddr
,
693 .tos
= RT_TOS(tos
) } },
694 .oif
= tunnel
->parms
.link
,
695 .proto
= IPPROTO_IPV6
};
696 if (ip_route_output_key(dev_net(dev
), &rt
, &fl
)) {
697 stats
->tx_carrier_errors
++;
701 if (rt
->rt_type
!= RTN_UNICAST
) {
703 stats
->tx_carrier_errors
++;
706 tdev
= rt
->u
.dst
.dev
;
715 mtu
= dst_mtu(&rt
->u
.dst
) - sizeof(struct iphdr
);
717 mtu
= skb_dst(skb
) ? dst_mtu(skb_dst(skb
)) : dev
->mtu
;
724 if (mtu
< IPV6_MIN_MTU
)
726 if (tunnel
->parms
.iph
.daddr
&& skb_dst(skb
))
727 skb_dst(skb
)->ops
->update_pmtu(skb_dst(skb
), mtu
);
729 if (skb
->len
> mtu
) {
730 icmpv6_send(skb
, ICMPV6_PKT_TOOBIG
, 0, mtu
, dev
);
735 if (tunnel
->err_count
> 0) {
736 if (time_before(jiffies
,
737 tunnel
->err_time
+ IPTUNNEL_ERR_TIMEO
)) {
739 dst_link_failure(skb
);
741 tunnel
->err_count
= 0;
745 * Okay, now see if we can stuff it in the buffer as-is.
747 max_headroom
= LL_RESERVED_SPACE(tdev
)+sizeof(struct iphdr
);
749 if (skb_headroom(skb
) < max_headroom
|| skb_shared(skb
) ||
750 (skb_cloned(skb
) && !skb_clone_writable(skb
, 0))) {
751 struct sk_buff
*new_skb
= skb_realloc_headroom(skb
, max_headroom
);
760 skb_set_owner_w(new_skb
, skb
->sk
);
763 iph6
= ipv6_hdr(skb
);
766 skb
->transport_header
= skb
->network_header
;
767 skb_push(skb
, sizeof(struct iphdr
));
768 skb_reset_network_header(skb
);
769 memset(&(IPCB(skb
)->opt
), 0, sizeof(IPCB(skb
)->opt
));
770 IPCB(skb
)->flags
= 0;
772 skb_dst_set(skb
, &rt
->u
.dst
);
775 * Push down and install the IPIP header.
780 iph
->ihl
= sizeof(struct iphdr
)>>2;
781 if (mtu
> IPV6_MIN_MTU
)
782 iph
->frag_off
= tiph
->frag_off
;
786 iph
->protocol
= IPPROTO_IPV6
;
787 iph
->tos
= INET_ECN_encapsulate(tos
, ipv6_get_dsfield(iph6
));
788 iph
->daddr
= rt
->rt_dst
;
789 iph
->saddr
= rt
->rt_src
;
791 if ((iph
->ttl
= tiph
->ttl
) == 0)
792 iph
->ttl
= iph6
->hop_limit
;
801 dst_link_failure(skb
);
809 static void ipip6_tunnel_bind_dev(struct net_device
*dev
)
811 struct net_device
*tdev
= NULL
;
812 struct ip_tunnel
*tunnel
;
815 tunnel
= netdev_priv(dev
);
816 iph
= &tunnel
->parms
.iph
;
819 struct flowi fl
= { .nl_u
= { .ip4_u
=
820 { .daddr
= iph
->daddr
,
822 .tos
= RT_TOS(iph
->tos
) } },
823 .oif
= tunnel
->parms
.link
,
824 .proto
= IPPROTO_IPV6
};
826 if (!ip_route_output_key(dev_net(dev
), &rt
, &fl
)) {
827 tdev
= rt
->u
.dst
.dev
;
830 dev
->flags
|= IFF_POINTOPOINT
;
833 if (!tdev
&& tunnel
->parms
.link
)
834 tdev
= __dev_get_by_index(dev_net(dev
), tunnel
->parms
.link
);
837 dev
->hard_header_len
= tdev
->hard_header_len
+ sizeof(struct iphdr
);
838 dev
->mtu
= tdev
->mtu
- sizeof(struct iphdr
);
839 if (dev
->mtu
< IPV6_MIN_MTU
)
840 dev
->mtu
= IPV6_MIN_MTU
;
842 dev
->iflink
= tunnel
->parms
.link
;
846 ipip6_tunnel_ioctl (struct net_device
*dev
, struct ifreq
*ifr
, int cmd
)
849 struct ip_tunnel_parm p
;
850 struct ip_tunnel_prl prl
;
852 struct net
*net
= dev_net(dev
);
853 struct sit_net
*sitn
= net_generic(net
, sit_net_id
);
858 if (dev
== sitn
->fb_tunnel_dev
) {
859 if (copy_from_user(&p
, ifr
->ifr_ifru
.ifru_data
, sizeof(p
))) {
863 t
= ipip6_tunnel_locate(net
, &p
, 0);
866 t
= netdev_priv(dev
);
867 memcpy(&p
, &t
->parms
, sizeof(p
));
868 if (copy_to_user(ifr
->ifr_ifru
.ifru_data
, &p
, sizeof(p
)))
875 if (!capable(CAP_NET_ADMIN
))
879 if (copy_from_user(&p
, ifr
->ifr_ifru
.ifru_data
, sizeof(p
)))
883 if (p
.iph
.version
!= 4 || p
.iph
.protocol
!= IPPROTO_IPV6
||
884 p
.iph
.ihl
!= 5 || (p
.iph
.frag_off
&htons(~IP_DF
)))
887 p
.iph
.frag_off
|= htons(IP_DF
);
889 t
= ipip6_tunnel_locate(net
, &p
, cmd
== SIOCADDTUNNEL
);
891 if (dev
!= sitn
->fb_tunnel_dev
&& cmd
== SIOCCHGTUNNEL
) {
898 if (((dev
->flags
&IFF_POINTOPOINT
) && !p
.iph
.daddr
) ||
899 (!(dev
->flags
&IFF_POINTOPOINT
) && p
.iph
.daddr
)) {
903 t
= netdev_priv(dev
);
904 ipip6_tunnel_unlink(sitn
, t
);
905 t
->parms
.iph
.saddr
= p
.iph
.saddr
;
906 t
->parms
.iph
.daddr
= p
.iph
.daddr
;
907 memcpy(dev
->dev_addr
, &p
.iph
.saddr
, 4);
908 memcpy(dev
->broadcast
, &p
.iph
.daddr
, 4);
909 ipip6_tunnel_link(sitn
, t
);
910 netdev_state_change(dev
);
916 if (cmd
== SIOCCHGTUNNEL
) {
917 t
->parms
.iph
.ttl
= p
.iph
.ttl
;
918 t
->parms
.iph
.tos
= p
.iph
.tos
;
919 if (t
->parms
.link
!= p
.link
) {
920 t
->parms
.link
= p
.link
;
921 ipip6_tunnel_bind_dev(dev
);
922 netdev_state_change(dev
);
925 if (copy_to_user(ifr
->ifr_ifru
.ifru_data
, &t
->parms
, sizeof(p
)))
928 err
= (cmd
== SIOCADDTUNNEL
? -ENOBUFS
: -ENOENT
);
933 if (!capable(CAP_NET_ADMIN
))
936 if (dev
== sitn
->fb_tunnel_dev
) {
938 if (copy_from_user(&p
, ifr
->ifr_ifru
.ifru_data
, sizeof(p
)))
941 if ((t
= ipip6_tunnel_locate(net
, &p
, 0)) == NULL
)
944 if (t
== netdev_priv(sitn
->fb_tunnel_dev
))
948 unregister_netdevice(dev
);
954 if (dev
== sitn
->fb_tunnel_dev
)
957 if (!(t
= netdev_priv(dev
)))
959 err
= ipip6_tunnel_get_prl(t
, ifr
->ifr_ifru
.ifru_data
);
966 if (!capable(CAP_NET_ADMIN
))
969 if (dev
== sitn
->fb_tunnel_dev
)
972 if (copy_from_user(&prl
, ifr
->ifr_ifru
.ifru_data
, sizeof(prl
)))
975 if (!(t
= netdev_priv(dev
)))
980 err
= ipip6_tunnel_del_prl(t
, &prl
);
984 err
= ipip6_tunnel_add_prl(t
, &prl
, cmd
== SIOCCHGPRL
);
987 netdev_state_change(dev
);
998 static int ipip6_tunnel_change_mtu(struct net_device
*dev
, int new_mtu
)
1000 if (new_mtu
< IPV6_MIN_MTU
|| new_mtu
> 0xFFF8 - sizeof(struct iphdr
))
1006 static const struct net_device_ops ipip6_netdev_ops
= {
1007 .ndo_uninit
= ipip6_tunnel_uninit
,
1008 .ndo_start_xmit
= ipip6_tunnel_xmit
,
1009 .ndo_do_ioctl
= ipip6_tunnel_ioctl
,
1010 .ndo_change_mtu
= ipip6_tunnel_change_mtu
,
1013 static void ipip6_tunnel_setup(struct net_device
*dev
)
1015 dev
->netdev_ops
= &ipip6_netdev_ops
;
1016 dev
->destructor
= free_netdev
;
1018 dev
->type
= ARPHRD_SIT
;
1019 dev
->hard_header_len
= LL_MAX_HEADER
+ sizeof(struct iphdr
);
1020 dev
->mtu
= ETH_DATA_LEN
- sizeof(struct iphdr
);
1021 dev
->flags
= IFF_NOARP
;
1022 dev
->priv_flags
&= ~IFF_XMIT_DST_RELEASE
;
1025 dev
->features
|= NETIF_F_NETNS_LOCAL
;
1028 static void ipip6_tunnel_init(struct net_device
*dev
)
1030 struct ip_tunnel
*tunnel
= netdev_priv(dev
);
1033 strcpy(tunnel
->parms
.name
, dev
->name
);
1035 memcpy(dev
->dev_addr
, &tunnel
->parms
.iph
.saddr
, 4);
1036 memcpy(dev
->broadcast
, &tunnel
->parms
.iph
.daddr
, 4);
1038 ipip6_tunnel_bind_dev(dev
);
1041 static void ipip6_fb_tunnel_init(struct net_device
*dev
)
1043 struct ip_tunnel
*tunnel
= netdev_priv(dev
);
1044 struct iphdr
*iph
= &tunnel
->parms
.iph
;
1045 struct net
*net
= dev_net(dev
);
1046 struct sit_net
*sitn
= net_generic(net
, sit_net_id
);
1049 strcpy(tunnel
->parms
.name
, dev
->name
);
1052 iph
->protocol
= IPPROTO_IPV6
;
1057 sitn
->tunnels_wc
[0] = tunnel
;
1060 static struct xfrm_tunnel sit_handler
= {
1061 .handler
= ipip6_rcv
,
1062 .err_handler
= ipip6_err
,
1066 static void sit_destroy_tunnels(struct sit_net
*sitn
)
1070 for (prio
= 1; prio
< 4; prio
++) {
1072 for (h
= 0; h
< HASH_SIZE
; h
++) {
1073 struct ip_tunnel
*t
;
1074 while ((t
= sitn
->tunnels
[prio
][h
]) != NULL
)
1075 unregister_netdevice(t
->dev
);
1080 static int sit_init_net(struct net
*net
)
1083 struct sit_net
*sitn
;
1086 sitn
= kzalloc(sizeof(struct sit_net
), GFP_KERNEL
);
1090 err
= net_assign_generic(net
, sit_net_id
, sitn
);
1094 sitn
->tunnels
[0] = sitn
->tunnels_wc
;
1095 sitn
->tunnels
[1] = sitn
->tunnels_l
;
1096 sitn
->tunnels
[2] = sitn
->tunnels_r
;
1097 sitn
->tunnels
[3] = sitn
->tunnels_r_l
;
1099 sitn
->fb_tunnel_dev
= alloc_netdev(sizeof(struct ip_tunnel
), "sit0",
1100 ipip6_tunnel_setup
);
1101 if (!sitn
->fb_tunnel_dev
) {
1105 dev_net_set(sitn
->fb_tunnel_dev
, net
);
1107 ipip6_fb_tunnel_init(sitn
->fb_tunnel_dev
);
1109 if ((err
= register_netdev(sitn
->fb_tunnel_dev
)))
1115 dev_put(sitn
->fb_tunnel_dev
);
1116 free_netdev(sitn
->fb_tunnel_dev
);
1125 static void sit_exit_net(struct net
*net
)
1127 struct sit_net
*sitn
;
1129 sitn
= net_generic(net
, sit_net_id
);
1131 sit_destroy_tunnels(sitn
);
1132 unregister_netdevice(sitn
->fb_tunnel_dev
);
1137 static struct pernet_operations sit_net_ops
= {
1138 .init
= sit_init_net
,
1139 .exit
= sit_exit_net
,
1142 static void __exit
sit_cleanup(void)
1144 xfrm4_tunnel_deregister(&sit_handler
, AF_INET6
);
1146 unregister_pernet_gen_device(sit_net_id
, &sit_net_ops
);
1149 static int __init
sit_init(void)
1153 printk(KERN_INFO
"IPv6 over IPv4 tunneling driver\n");
1155 if (xfrm4_tunnel_register(&sit_handler
, AF_INET6
) < 0) {
1156 printk(KERN_INFO
"sit init: Can't add protocol\n");
1160 err
= register_pernet_gen_device(&sit_net_id
, &sit_net_ops
);
1162 xfrm4_tunnel_deregister(&sit_handler
, AF_INET6
);
1167 module_init(sit_init
);
1168 module_exit(sit_cleanup
);
1169 MODULE_LICENSE("GPL");
1170 MODULE_ALIAS("sit0");