// SPDX-License-Identifier: GPL-2.0-or-later
/*
 * mpls tunnels		An implementation of mpls tunnels using the light weight
 *			tunnel infrastructure
 *
 * Authors:		Roopa Prabhu, <roopa@cumulusnetworks.com>
 */
#include <linux/types.h>
#include <linux/skbuff.h>
#include <linux/net.h>
#include <linux/module.h>
#include <linux/mpls.h>
#include <linux/vmalloc.h>
#include <net/ip.h>
#include <net/dst.h>
#include <net/lwtunnel.h>
#include <net/netevent.h>
#include <net/netns/generic.h>
#include <net/ip6_fib.h>
#include <net/route.h>
#include <net/mpls_iptunnel.h>
#include <linux/mpls_iptunnel.h>
#include "internal.h"
25 static const struct nla_policy mpls_iptunnel_policy
[MPLS_IPTUNNEL_MAX
+ 1] = {
26 [MPLS_IPTUNNEL_DST
] = { .len
= sizeof(u32
) },
27 [MPLS_IPTUNNEL_TTL
] = { .type
= NLA_U8
},
30 static unsigned int mpls_encap_size(struct mpls_iptunnel_encap
*en
)
32 /* The size of the layer 2.5 labels to be added for this route */
33 return en
->labels
* sizeof(struct mpls_shim_hdr
);
36 static int mpls_xmit(struct sk_buff
*skb
)
38 struct mpls_iptunnel_encap
*tun_encap_info
;
39 struct mpls_shim_hdr
*hdr
;
40 struct net_device
*out_dev
;
42 unsigned int new_header_size
;
44 struct dst_entry
*dst
= skb_dst(skb
);
45 struct rtable
*rt
= NULL
;
46 struct rt6_info
*rt6
= NULL
;
47 struct mpls_dev
*out_mdev
;
54 /* Find the output device */
56 net
= dev_net(out_dev
);
60 if (!mpls_output_possible(out_dev
) ||
61 !dst
->lwtstate
|| skb_warn_if_lro(skb
))
64 skb_forward_csum(skb
);
66 tun_encap_info
= mpls_lwtunnel_encap(dst
->lwtstate
);
68 /* Obtain the ttl using the following set of rules.
70 * LWT ttl propagation setting:
71 * - disabled => use default TTL value from LWT
72 * - enabled => use TTL value from IPv4/IPv6 header
74 * Global ttl propagation setting:
75 * - disabled => use default TTL value from global setting
76 * - enabled => use TTL value from IPv4/IPv6 header
78 if (dst
->ops
->family
== AF_INET
) {
79 if (tun_encap_info
->ttl_propagate
== MPLS_TTL_PROP_DISABLED
)
80 ttl
= tun_encap_info
->default_ttl
;
81 else if (tun_encap_info
->ttl_propagate
== MPLS_TTL_PROP_DEFAULT
&&
82 !net
->mpls
.ip_ttl_propagate
)
83 ttl
= net
->mpls
.default_ttl
;
85 ttl
= ip_hdr(skb
)->ttl
;
86 rt
= (struct rtable
*)dst
;
87 } else if (dst
->ops
->family
== AF_INET6
) {
88 if (tun_encap_info
->ttl_propagate
== MPLS_TTL_PROP_DISABLED
)
89 ttl
= tun_encap_info
->default_ttl
;
90 else if (tun_encap_info
->ttl_propagate
== MPLS_TTL_PROP_DEFAULT
&&
91 !net
->mpls
.ip_ttl_propagate
)
92 ttl
= net
->mpls
.default_ttl
;
94 ttl
= ipv6_hdr(skb
)->hop_limit
;
95 rt6
= (struct rt6_info
*)dst
;
100 /* Verify the destination can hold the packet */
101 new_header_size
= mpls_encap_size(tun_encap_info
);
102 mtu
= mpls_dev_mtu(out_dev
);
103 if (mpls_pkt_too_big(skb
, mtu
- new_header_size
))
106 hh_len
= LL_RESERVED_SPACE(out_dev
);
107 if (!out_dev
->header_ops
)
110 /* Ensure there is enough space for the headers in the skb */
111 if (skb_cow(skb
, hh_len
+ new_header_size
))
114 skb_set_inner_protocol(skb
, skb
->protocol
);
115 skb_reset_inner_network_header(skb
);
117 skb_push(skb
, new_header_size
);
119 skb_reset_network_header(skb
);
122 skb
->protocol
= htons(ETH_P_MPLS_UC
);
124 /* Push the new labels */
127 for (i
= tun_encap_info
->labels
- 1; i
>= 0; i
--) {
128 hdr
[i
] = mpls_entry_encode(tun_encap_info
->label
[i
],
133 mpls_stats_inc_outucastpkts(out_dev
, skb
);
136 if (rt
->rt_gw_family
== AF_INET6
)
137 err
= neigh_xmit(NEIGH_ND_TABLE
, out_dev
, &rt
->rt_gw6
,
140 err
= neigh_xmit(NEIGH_ARP_TABLE
, out_dev
, &rt
->rt_gw4
,
143 if (ipv6_addr_v4mapped(&rt6
->rt6i_gateway
)) {
145 err
= neigh_xmit(NEIGH_ARP_TABLE
, out_dev
, &rt6
->rt6i_gateway
.s6_addr32
[3],
148 err
= neigh_xmit(NEIGH_ND_TABLE
, out_dev
, &rt6
->rt6i_gateway
,
152 net_dbg_ratelimited("%s: packet transmission failed: %d\n",
155 return LWTUNNEL_XMIT_DONE
;
158 out_mdev
= out_dev
? mpls_dev_get(out_dev
) : NULL
;
160 MPLS_INC_STATS(out_mdev
, tx_errors
);
165 static int mpls_build_state(struct net
*net
, struct nlattr
*nla
,
166 unsigned int family
, const void *cfg
,
167 struct lwtunnel_state
**ts
,
168 struct netlink_ext_ack
*extack
)
170 struct mpls_iptunnel_encap
*tun_encap_info
;
171 struct nlattr
*tb
[MPLS_IPTUNNEL_MAX
+ 1];
172 struct lwtunnel_state
*newts
;
176 ret
= nla_parse_nested_deprecated(tb
, MPLS_IPTUNNEL_MAX
, nla
,
177 mpls_iptunnel_policy
, extack
);
181 if (!tb
[MPLS_IPTUNNEL_DST
]) {
182 NL_SET_ERR_MSG(extack
, "MPLS_IPTUNNEL_DST attribute is missing");
186 /* determine number of labels */
187 if (nla_get_labels(tb
[MPLS_IPTUNNEL_DST
], MAX_NEW_LABELS
,
188 &n_labels
, NULL
, extack
))
191 newts
= lwtunnel_state_alloc(struct_size(tun_encap_info
, label
,
196 tun_encap_info
= mpls_lwtunnel_encap(newts
);
197 ret
= nla_get_labels(tb
[MPLS_IPTUNNEL_DST
], n_labels
,
198 &tun_encap_info
->labels
, tun_encap_info
->label
,
203 tun_encap_info
->ttl_propagate
= MPLS_TTL_PROP_DEFAULT
;
205 if (tb
[MPLS_IPTUNNEL_TTL
]) {
206 tun_encap_info
->default_ttl
= nla_get_u8(tb
[MPLS_IPTUNNEL_TTL
]);
207 /* TTL 0 implies propagate from IP header */
208 tun_encap_info
->ttl_propagate
= tun_encap_info
->default_ttl
?
209 MPLS_TTL_PROP_DISABLED
:
210 MPLS_TTL_PROP_ENABLED
;
213 newts
->type
= LWTUNNEL_ENCAP_MPLS
;
214 newts
->flags
|= LWTUNNEL_STATE_XMIT_REDIRECT
;
215 newts
->headroom
= mpls_encap_size(tun_encap_info
);
228 static int mpls_fill_encap_info(struct sk_buff
*skb
,
229 struct lwtunnel_state
*lwtstate
)
231 struct mpls_iptunnel_encap
*tun_encap_info
;
233 tun_encap_info
= mpls_lwtunnel_encap(lwtstate
);
235 if (nla_put_labels(skb
, MPLS_IPTUNNEL_DST
, tun_encap_info
->labels
,
236 tun_encap_info
->label
))
237 goto nla_put_failure
;
239 if (tun_encap_info
->ttl_propagate
!= MPLS_TTL_PROP_DEFAULT
&&
240 nla_put_u8(skb
, MPLS_IPTUNNEL_TTL
, tun_encap_info
->default_ttl
))
241 goto nla_put_failure
;
249 static int mpls_encap_nlsize(struct lwtunnel_state
*lwtstate
)
251 struct mpls_iptunnel_encap
*tun_encap_info
;
254 tun_encap_info
= mpls_lwtunnel_encap(lwtstate
);
256 nlsize
= nla_total_size(tun_encap_info
->labels
* 4);
258 if (tun_encap_info
->ttl_propagate
!= MPLS_TTL_PROP_DEFAULT
)
259 nlsize
+= nla_total_size(1);
264 static int mpls_encap_cmp(struct lwtunnel_state
*a
, struct lwtunnel_state
*b
)
266 struct mpls_iptunnel_encap
*a_hdr
= mpls_lwtunnel_encap(a
);
267 struct mpls_iptunnel_encap
*b_hdr
= mpls_lwtunnel_encap(b
);
270 if (a_hdr
->labels
!= b_hdr
->labels
||
271 a_hdr
->ttl_propagate
!= b_hdr
->ttl_propagate
||
272 a_hdr
->default_ttl
!= b_hdr
->default_ttl
)
275 for (l
= 0; l
< a_hdr
->labels
; l
++)
276 if (a_hdr
->label
[l
] != b_hdr
->label
[l
])
281 static const struct lwtunnel_encap_ops mpls_iptun_ops
= {
282 .build_state
= mpls_build_state
,
284 .fill_encap
= mpls_fill_encap_info
,
285 .get_encap_size
= mpls_encap_nlsize
,
286 .cmp_encap
= mpls_encap_cmp
,
287 .owner
= THIS_MODULE
,
290 static int __init
mpls_iptunnel_init(void)
292 return lwtunnel_encap_add_ops(&mpls_iptun_ops
, LWTUNNEL_ENCAP_MPLS
);
294 module_init(mpls_iptunnel_init
);
296 static void __exit
mpls_iptunnel_exit(void)
298 lwtunnel_encap_del_ops(&mpls_iptun_ops
, LWTUNNEL_ENCAP_MPLS
);
300 module_exit(mpls_iptunnel_exit
);
302 MODULE_ALIAS_RTNL_LWT(MPLS
);
303 MODULE_DESCRIPTION("MultiProtocol Label Switching IP Tunnels");
304 MODULE_LICENSE("GPL v2");