/*
 * mpls tunnels	An implementation of mpls tunnels using the light weight
 *		tunnel (lwtunnel) infrastructure
 *
 * Authors:	Roopa Prabhu, <roopa@cumulusnetworks.com>
 *
 *		This program is free software; you can redistribute it and/or
 *		modify it under the terms of the GNU General Public License
 *		as published by the Free Software Foundation; either version
 *		2 of the License, or (at your option) any later version.
 */
#include <linux/types.h>
#include <linux/skbuff.h>
#include <linux/net.h>
#include <linux/module.h>
#include <linux/mpls.h>
#include <linux/slab.h>
#include <linux/vmalloc.h>
#include <net/lwtunnel.h>
#include <net/mpls.h>
#include <net/netevent.h>
#include <net/netns/generic.h>
#include <net/ip6_fib.h>
#include <net/route.h>
#include <net/mpls_iptunnel.h>
#include <linux/mpls_iptunnel.h>
30 static const struct nla_policy mpls_iptunnel_policy
[MPLS_IPTUNNEL_MAX
+ 1] = {
31 [MPLS_IPTUNNEL_DST
] = { .type
= NLA_U32
},
32 [MPLS_IPTUNNEL_TTL
] = { .type
= NLA_U8
},
35 static unsigned int mpls_encap_size(struct mpls_iptunnel_encap
*en
)
37 /* The size of the layer 2.5 labels to be added for this route */
38 return en
->labels
* sizeof(struct mpls_shim_hdr
);
41 static int mpls_xmit(struct sk_buff
*skb
)
43 struct mpls_iptunnel_encap
*tun_encap_info
;
44 struct mpls_shim_hdr
*hdr
;
45 struct net_device
*out_dev
;
47 unsigned int new_header_size
;
49 struct dst_entry
*dst
= skb_dst(skb
);
50 struct rtable
*rt
= NULL
;
51 struct rt6_info
*rt6
= NULL
;
52 struct mpls_dev
*out_mdev
;
59 /* Find the output device */
61 net
= dev_net(out_dev
);
65 if (!mpls_output_possible(out_dev
) ||
66 !dst
->lwtstate
|| skb_warn_if_lro(skb
))
69 skb_forward_csum(skb
);
71 tun_encap_info
= mpls_lwtunnel_encap(dst
->lwtstate
);
73 /* Obtain the ttl using the following set of rules.
75 * LWT ttl propagation setting:
76 * - disabled => use default TTL value from LWT
77 * - enabled => use TTL value from IPv4/IPv6 header
79 * Global ttl propagation setting:
80 * - disabled => use default TTL value from global setting
81 * - enabled => use TTL value from IPv4/IPv6 header
83 if (dst
->ops
->family
== AF_INET
) {
84 if (tun_encap_info
->ttl_propagate
== MPLS_TTL_PROP_DISABLED
)
85 ttl
= tun_encap_info
->default_ttl
;
86 else if (tun_encap_info
->ttl_propagate
== MPLS_TTL_PROP_DEFAULT
&&
87 !net
->mpls
.ip_ttl_propagate
)
88 ttl
= net
->mpls
.default_ttl
;
90 ttl
= ip_hdr(skb
)->ttl
;
91 rt
= (struct rtable
*)dst
;
92 } else if (dst
->ops
->family
== AF_INET6
) {
93 if (tun_encap_info
->ttl_propagate
== MPLS_TTL_PROP_DISABLED
)
94 ttl
= tun_encap_info
->default_ttl
;
95 else if (tun_encap_info
->ttl_propagate
== MPLS_TTL_PROP_DEFAULT
&&
96 !net
->mpls
.ip_ttl_propagate
)
97 ttl
= net
->mpls
.default_ttl
;
99 ttl
= ipv6_hdr(skb
)->hop_limit
;
100 rt6
= (struct rt6_info
*)dst
;
105 /* Verify the destination can hold the packet */
106 new_header_size
= mpls_encap_size(tun_encap_info
);
107 mtu
= mpls_dev_mtu(out_dev
);
108 if (mpls_pkt_too_big(skb
, mtu
- new_header_size
))
111 hh_len
= LL_RESERVED_SPACE(out_dev
);
112 if (!out_dev
->header_ops
)
115 /* Ensure there is enough space for the headers in the skb */
116 if (skb_cow(skb
, hh_len
+ new_header_size
))
119 skb_set_inner_protocol(skb
, skb
->protocol
);
120 skb_reset_inner_network_header(skb
);
122 skb_push(skb
, new_header_size
);
124 skb_reset_network_header(skb
);
127 skb
->protocol
= htons(ETH_P_MPLS_UC
);
129 /* Push the new labels */
132 for (i
= tun_encap_info
->labels
- 1; i
>= 0; i
--) {
133 hdr
[i
] = mpls_entry_encode(tun_encap_info
->label
[i
],
138 mpls_stats_inc_outucastpkts(out_dev
, skb
);
141 err
= neigh_xmit(NEIGH_ARP_TABLE
, out_dev
, &rt
->rt_gateway
,
144 err
= neigh_xmit(NEIGH_ND_TABLE
, out_dev
, &rt6
->rt6i_gateway
,
147 net_dbg_ratelimited("%s: packet transmission failed: %d\n",
150 return LWTUNNEL_XMIT_DONE
;
153 out_mdev
= out_dev
? mpls_dev_get(out_dev
) : NULL
;
155 MPLS_INC_STATS(out_mdev
, tx_errors
);
160 static int mpls_build_state(struct nlattr
*nla
,
161 unsigned int family
, const void *cfg
,
162 struct lwtunnel_state
**ts
,
163 struct netlink_ext_ack
*extack
)
165 struct mpls_iptunnel_encap
*tun_encap_info
;
166 struct nlattr
*tb
[MPLS_IPTUNNEL_MAX
+ 1];
167 struct lwtunnel_state
*newts
;
171 ret
= nla_parse_nested(tb
, MPLS_IPTUNNEL_MAX
, nla
,
172 mpls_iptunnel_policy
, extack
);
176 if (!tb
[MPLS_IPTUNNEL_DST
]) {
177 NL_SET_ERR_MSG(extack
, "MPLS_IPTUNNEL_DST attribute is missing");
181 /* determine number of labels */
182 if (nla_get_labels(tb
[MPLS_IPTUNNEL_DST
], MAX_NEW_LABELS
,
183 &n_labels
, NULL
, extack
))
186 newts
= lwtunnel_state_alloc(struct_size(tun_encap_info
, label
,
191 tun_encap_info
= mpls_lwtunnel_encap(newts
);
192 ret
= nla_get_labels(tb
[MPLS_IPTUNNEL_DST
], n_labels
,
193 &tun_encap_info
->labels
, tun_encap_info
->label
,
198 tun_encap_info
->ttl_propagate
= MPLS_TTL_PROP_DEFAULT
;
200 if (tb
[MPLS_IPTUNNEL_TTL
]) {
201 tun_encap_info
->default_ttl
= nla_get_u8(tb
[MPLS_IPTUNNEL_TTL
]);
202 /* TTL 0 implies propagate from IP header */
203 tun_encap_info
->ttl_propagate
= tun_encap_info
->default_ttl
?
204 MPLS_TTL_PROP_DISABLED
:
205 MPLS_TTL_PROP_ENABLED
;
208 newts
->type
= LWTUNNEL_ENCAP_MPLS
;
209 newts
->flags
|= LWTUNNEL_STATE_XMIT_REDIRECT
;
210 newts
->headroom
= mpls_encap_size(tun_encap_info
);
223 static int mpls_fill_encap_info(struct sk_buff
*skb
,
224 struct lwtunnel_state
*lwtstate
)
226 struct mpls_iptunnel_encap
*tun_encap_info
;
228 tun_encap_info
= mpls_lwtunnel_encap(lwtstate
);
230 if (nla_put_labels(skb
, MPLS_IPTUNNEL_DST
, tun_encap_info
->labels
,
231 tun_encap_info
->label
))
232 goto nla_put_failure
;
234 if (tun_encap_info
->ttl_propagate
!= MPLS_TTL_PROP_DEFAULT
&&
235 nla_put_u8(skb
, MPLS_IPTUNNEL_TTL
, tun_encap_info
->default_ttl
))
236 goto nla_put_failure
;
244 static int mpls_encap_nlsize(struct lwtunnel_state
*lwtstate
)
246 struct mpls_iptunnel_encap
*tun_encap_info
;
249 tun_encap_info
= mpls_lwtunnel_encap(lwtstate
);
251 nlsize
= nla_total_size(tun_encap_info
->labels
* 4);
253 if (tun_encap_info
->ttl_propagate
!= MPLS_TTL_PROP_DEFAULT
)
254 nlsize
+= nla_total_size(1);
259 static int mpls_encap_cmp(struct lwtunnel_state
*a
, struct lwtunnel_state
*b
)
261 struct mpls_iptunnel_encap
*a_hdr
= mpls_lwtunnel_encap(a
);
262 struct mpls_iptunnel_encap
*b_hdr
= mpls_lwtunnel_encap(b
);
265 if (a_hdr
->labels
!= b_hdr
->labels
||
266 a_hdr
->ttl_propagate
!= b_hdr
->ttl_propagate
||
267 a_hdr
->default_ttl
!= b_hdr
->default_ttl
)
270 for (l
= 0; l
< a_hdr
->labels
; l
++)
271 if (a_hdr
->label
[l
] != b_hdr
->label
[l
])
276 static const struct lwtunnel_encap_ops mpls_iptun_ops
= {
277 .build_state
= mpls_build_state
,
279 .fill_encap
= mpls_fill_encap_info
,
280 .get_encap_size
= mpls_encap_nlsize
,
281 .cmp_encap
= mpls_encap_cmp
,
282 .owner
= THIS_MODULE
,
285 static int __init
mpls_iptunnel_init(void)
287 return lwtunnel_encap_add_ops(&mpls_iptun_ops
, LWTUNNEL_ENCAP_MPLS
);
289 module_init(mpls_iptunnel_init
);
291 static void __exit
mpls_iptunnel_exit(void)
293 lwtunnel_encap_del_ops(&mpls_iptun_ops
, LWTUNNEL_ENCAP_MPLS
);
295 module_exit(mpls_iptunnel_exit
);
297 MODULE_ALIAS_RTNL_LWT(MPLS
);
298 MODULE_DESCRIPTION("MultiProtocol Label Switching IP Tunnels");
299 MODULE_LICENSE("GPL v2");