2 * lwtunnel Infrastructure for light weight tunnels like mpls
4 * Authors: Roopa Prabhu, <roopa@cumulusnetworks.com>
6 * This program is free software; you can redistribute it and/or
7 * modify it under the terms of the GNU General Public License
8 * as published by the Free Software Foundation; either version
9 * 2 of the License, or (at your option) any later version.
13 #include <linux/capability.h>
14 #include <linux/module.h>
15 #include <linux/types.h>
16 #include <linux/kernel.h>
17 #include <linux/slab.h>
18 #include <linux/uaccess.h>
19 #include <linux/skbuff.h>
20 #include <linux/netdevice.h>
21 #include <linux/lwtunnel.h>
23 #include <linux/init.h>
24 #include <linux/err.h>
26 #include <net/lwtunnel.h>
27 #include <net/rtnetlink.h>
28 #include <net/ip6_fib.h>
29 #include <net/nexthop.h>
/*
 * lwtunnel_encap_str - map an encap type to a short name string
 * @encap_type: one of enum lwtunnel_encap_types
 *
 * The only caller visible in this file is lwtunnel_valid_encap_type(),
 * which uses a non-NULL result as the name part of an rtnl-lwt-<name>
 * module request and skips the request when the result is NULL.
 *
 * The case labels below cover MPLS, ILA, SEG6, BPF, IP6, IP, NONE and
 * __LWTUNNEL_ENCAP_MAX.
 *
 * NOTE(review): the switch statement, every return statement and the braces
 * are absent from this copy of the file, so the string returned for each
 * case cannot be confirmed from here. Presumably the first four cases
 * return a name and the remaining ones fall through to a warning and
 * a NULL return - TODO confirm against a complete copy.
 */
33 static const char *lwtunnel_encap_str(enum lwtunnel_encap_types encap_type
)
35 /* Only lwt encaps implemented without using an interface for
36 * the encap need to return a string here.
39 case LWTUNNEL_ENCAP_MPLS
:
41 case LWTUNNEL_ENCAP_ILA
:
43 case LWTUNNEL_ENCAP_SEG6
:
45 case LWTUNNEL_ENCAP_BPF
:
47 case LWTUNNEL_ENCAP_IP6
:
48 case LWTUNNEL_ENCAP_IP
:
49 case LWTUNNEL_ENCAP_NONE
:
50 case __LWTUNNEL_ENCAP_MAX
:
51 /* should not have got here */
58 #endif /* CONFIG_MODULES */
/*
 * lwtunnel_state_alloc - allocate a tunnel state with trailing encap space
 * @encap_len: number of extra bytes requested after struct lwtunnel_state
 *
 * Requests sizeof(struct lwtunnel_state) + encap_len bytes from kzalloc()
 * with GFP_ATOMIC, so the allocation is zero-filled and does not sleep.
 *
 * NOTE(review): the return statement is absent from this copy; presumably
 * lws is returned as is, which would be NULL on allocation failure -
 * TODO confirm.
 * NOTE(review): encap_len is a signed int added to sizeof() with no range
 * check visible here; callers presumably pass a small non-negative value.
 */
60 struct lwtunnel_state
*lwtunnel_state_alloc(int encap_len
)
62 struct lwtunnel_state
*lws
;
64 lws
= kzalloc(sizeof(*lws
) + encap_len
, GFP_ATOMIC
);
68 EXPORT_SYMBOL(lwtunnel_state_alloc
);
/*
 * Table of registered encap operations, indexed by encap type.
 * It has LWTUNNEL_ENCAP_MAX + 1 slots so that LWTUNNEL_ENCAP_MAX itself is
 * a valid index. Slots are __rcu pointers: in this file they are updated
 * with cmpxchg() by the add/del functions and read with rcu_dereference()
 * by the lookup helpers (lwtstate_free() reads the slot directly).
 */
70 static const struct lwtunnel_encap_ops __rcu
*
71 lwtun_encaps
[LWTUNNEL_ENCAP_MAX
+ 1] __read_mostly
;
/*
 * lwtunnel_encap_add_ops - register the operations for one encap type
 * @ops: operations table to install
 *
 * A type number above LWTUNNEL_ENCAP_MAX is rejected before the table is
 * touched. Otherwise the result is derived from a negated cmpxchg() on
 * a pointer cast to (const struct lwtunnel_encap_ops **).
 *
 * NOTE(review): the second parameter declaration (num is used below), the
 * value returned for an out-of-range num, and the cmpxchg() operands are
 * all absent from this copy. Presumably the slot lwtun_encaps[num] is set
 * to ops only when it currently holds NULL - TODO confirm against
 * a complete copy.
 */
73 int lwtunnel_encap_add_ops(const struct lwtunnel_encap_ops
*ops
,
76 if (num
> LWTUNNEL_ENCAP_MAX
)
79 return !cmpxchg((const struct lwtunnel_encap_ops
**)
83 EXPORT_SYMBOL(lwtunnel_encap_add_ops
);
/*
 * lwtunnel_encap_del_ops - unregister the operations for one encap type
 * @ops: operations table expected to be installed in the slot
 * @encap_type: index of the slot in lwtun_encaps
 *
 * LWTUNNEL_ENCAP_NONE and values above LWTUNNEL_ENCAP_MAX are rejected
 * before the table is touched (the value returned on that path is not
 * visible in this copy).
 *
 * The slot is cleared with cmpxchg(&slot, ops, NULL), so it is only reset
 * when it still holds @ops. ret is 0 when the old value was @ops and -1
 * otherwise.
 *
 * NOTE(review): failure is reported as a bare -1 rather than a named errno.
 * NOTE(review): the statements between the cmpxchg() and the end of the
 * function are absent here. Since readers use rcu_dereference(), a wait
 * for a grace period would be expected before returning - TODO confirm.
 */
85 int lwtunnel_encap_del_ops(const struct lwtunnel_encap_ops
*ops
,
86 unsigned int encap_type
)
90 if (encap_type
== LWTUNNEL_ENCAP_NONE
||
91 encap_type
> LWTUNNEL_ENCAP_MAX
)
94 ret
= (cmpxchg((const struct lwtunnel_encap_ops
**)
95 &lwtun_encaps
[encap_type
],
96 ops
, NULL
) == ops
) ? 0 : -1;
102 EXPORT_SYMBOL(lwtunnel_encap_del_ops
);
/*
 * lwtunnel_build_state - build a tunnel state through the registered ops
 * @encap_type: encap type selecting the slot in lwtun_encaps
 * @encap: netlink attribute handed to the handler, also attached to errors
 * @family: passed through unchanged to the handler
 * @cfg: passed through unchanged to the handler
 * @lws: out parameter passed through to the handler
 * @extack: extended ack that receives the error messages set below
 *
 * Steps visible in this copy:
 *  - LWTUNNEL_ENCAP_NONE and values above LWTUNNEL_ENCAP_MAX are rejected
 *    with an unknown-type message attached to @encap.
 *  - The ops pointer is read with rcu_dereference().
 *  - The handler is only called when ops is set, ops->build_state is set
 *    and try_module_get(ops->owner) succeeds; its result is stored in ret.
 *  - A not-supported message is attached to @encap on a later path.
 *
 * NOTE(review): the local declarations, the RCU read-side lock calls, the
 * condition in front of module_put() and the condition in front of the
 * not-supported message are absent from this copy. Presumably the module
 * reference is dropped only when the handler fails, since lwtstate_free()
 * also drops one reference per state - TODO confirm.
 */
104 int lwtunnel_build_state(u16 encap_type
,
105 struct nlattr
*encap
, unsigned int family
,
106 const void *cfg
, struct lwtunnel_state
**lws
,
107 struct netlink_ext_ack
*extack
)
109 const struct lwtunnel_encap_ops
*ops
;
113 if (encap_type
== LWTUNNEL_ENCAP_NONE
||
114 encap_type
> LWTUNNEL_ENCAP_MAX
) {
115 NL_SET_ERR_MSG_ATTR(extack
, encap
,
116 "Unknown LWT encapsulation type");
122 ops
= rcu_dereference(lwtun_encaps
[encap_type
]);
123 if (likely(ops
&& ops
->build_state
&& try_module_get(ops
->owner
))) {
125 ret
= ops
->build_state(encap
, family
, cfg
, lws
, extack
);
127 module_put(ops
->owner
);
131 /* don't rely on -EOPNOTSUPP to detect match as build_state
132 * handlers could return it
135 NL_SET_ERR_MSG_ATTR(extack
, encap
,
136 "LWT encapsulation type not supported");
141 EXPORT_SYMBOL(lwtunnel_build_state
);
/*
 * lwtunnel_valid_encap_type - check that an encap type has registered ops
 * @encap_type: encap type to check
 * @extack: extended ack that receives the error messages set below
 *
 * Steps visible in this copy:
 *  - LWTUNNEL_ENCAP_NONE and values above LWTUNNEL_ENCAP_MAX are rejected
 *    with an unknown-type message.
 *  - The ops pointer is read with rcu_dereference().
 *  - With CONFIG_MODULES, lwtunnel_encap_str() is asked for a name; when it
 *    is non-NULL a module named rtnl-lwt-<name> is requested and the ops
 *    pointer is read again.
 *  - ret is 0 when ops is set, -EOPNOTSUPP otherwise; a not-supported
 *    message is set on a later path.
 *
 * NOTE(review): the condition that decides whether a module load is
 * attempted, the locking around request_module(), the matching #endif and
 * the condition in front of the final message are absent from this copy.
 * Presumably the load is only tried when the first lookup found no ops -
 * TODO confirm.
 */
143 int lwtunnel_valid_encap_type(u16 encap_type
, struct netlink_ext_ack
*extack
)
145 const struct lwtunnel_encap_ops
*ops
;
148 if (encap_type
== LWTUNNEL_ENCAP_NONE
||
149 encap_type
> LWTUNNEL_ENCAP_MAX
) {
150 NL_SET_ERR_MSG(extack
, "Unknown lwt encapsulation type");
155 ops
= rcu_dereference(lwtun_encaps
[encap_type
]);
157 #ifdef CONFIG_MODULES
159 const char *encap_type_str
= lwtunnel_encap_str(encap_type
);
161 if (encap_type_str
) {
163 request_module("rtnl-lwt-%s", encap_type_str
);
167 ops
= rcu_dereference(lwtun_encaps
[encap_type
]);
172 ret
= ops
? 0 : -EOPNOTSUPP
;
174 NL_SET_ERR_MSG(extack
, "lwt encapsulation type not supported");
178 EXPORT_SYMBOL(lwtunnel_valid_encap_type
);
/*
 * lwtunnel_valid_encap_type_attr - validate encap types in a nexthop list
 * @attr: start of the buffer, reinterpreted as a struct rtnexthop sequence
 * @remaining: number of bytes left in that buffer
 * @extack: extended ack (its use here is cut off in this copy)
 *
 * Walks the rtnexthop entries while rtnh_ok() accepts the current entry.
 * For each entry it takes the attribute area and length from rtnh_attrs()
 * and rtnh_attrlen(), searches it for RTA_ENCAP_TYPE with nla_find(), reads
 * the type as a u16 and hands it to lwtunnel_valid_encap_type(). The walk
 * advances with rtnh_next(), which also updates remaining.
 *
 * NOTE(review): the guards around nla_find() and nla_get_u16(), the rest of
 * the lwtunnel_valid_encap_type() call and all return statements are absent
 * from this copy. Presumably nla_get_u16() is only reached when the
 * attribute was found, and the first failing type ends the walk with an
 * error - TODO confirm.
 */
180 int lwtunnel_valid_encap_type_attr(struct nlattr
*attr
, int remaining
,
181 struct netlink_ext_ack
*extack
)
183 struct rtnexthop
*rtnh
= (struct rtnexthop
*)attr
;
184 struct nlattr
*nla_entype
;
185 struct nlattr
*attrs
;
189 while (rtnh_ok(rtnh
, remaining
)) {
190 attrlen
= rtnh_attrlen(rtnh
);
192 attrs
= rtnh_attrs(rtnh
);
193 nla_entype
= nla_find(attrs
, attrlen
, RTA_ENCAP_TYPE
);
196 encap_type
= nla_get_u16(nla_entype
);
198 if (lwtunnel_valid_encap_type(encap_type
,
203 rtnh
= rtnh_next(rtnh
, &remaining
);
208 EXPORT_SYMBOL(lwtunnel_valid_encap_type_attr
);
/*
 * lwtstate_free - release a tunnel state and its module reference
 * @lws: state to release; lws->type selects the ops slot
 *
 * Reads the ops pointer straight from lwtun_encaps[lws->type] (no
 * rcu_dereference() here, unlike the other lookups in this file), calls
 * ops->destroy_state(lws) when that hook is set, and drops one reference
 * on ops->owner with module_put().
 *
 * NOTE(review): the statements that actually free lws are absent from this
 * copy - TODO confirm how the memory is released on each branch.
 * NOTE(review): on the visible lines lws->type is not range checked and ops
 * is dereferenced without a NULL check; this presumably relies on the state
 * having been created through a registered ops table - confirm.
 */
210 void lwtstate_free(struct lwtunnel_state
*lws
)
212 const struct lwtunnel_encap_ops
*ops
= lwtun_encaps
[lws
->type
];
214 if (ops
->destroy_state
) {
215 ops
->destroy_state(lws
);
220 module_put(ops
->owner
);
222 EXPORT_SYMBOL(lwtstate_free
);
/*
 * lwtunnel_fill_encap - dump the encap of a tunnel state into a message
 * @skb: message buffer being filled
 * @lwtstate: state to dump; lwtstate->type selects the ops slot
 *
 * Steps visible in this copy:
 *  - Types LWTUNNEL_ENCAP_NONE and above LWTUNNEL_ENCAP_MAX take an early
 *    exit (the value returned there is not visible).
 *  - An RTA_ENCAP nest is opened with nla_nest_start().
 *  - The ops pointer is read with rcu_dereference() and ops->fill_encap is
 *    called when set; its result is stored in ret.
 *  - The nest is closed with nla_nest_end() and the type is added as a u16
 *    RTA_ENCAP_TYPE attribute.
 *  - The failure path cancels the nest with nla_nest_cancel() and returns
 *    ret, except that -EOPNOTSUPP is turned into 0.
 *
 * NOTE(review): the initial value of ret, the check of the nla_nest_start()
 * result, the conditions in front of both goto statements, the success
 * return and the nla_put_failure label itself are absent from this copy -
 * TODO confirm against a complete copy.
 */
224 int lwtunnel_fill_encap(struct sk_buff
*skb
, struct lwtunnel_state
*lwtstate
)
226 const struct lwtunnel_encap_ops
*ops
;
233 if (lwtstate
->type
== LWTUNNEL_ENCAP_NONE
||
234 lwtstate
->type
> LWTUNNEL_ENCAP_MAX
)
237 nest
= nla_nest_start(skb
, RTA_ENCAP
);
243 ops
= rcu_dereference(lwtun_encaps
[lwtstate
->type
]);
244 if (likely(ops
&& ops
->fill_encap
))
245 ret
= ops
->fill_encap(skb
, lwtstate
);
249 goto nla_put_failure
;
250 nla_nest_end(skb
, nest
);
251 ret
= nla_put_u16(skb
, RTA_ENCAP_TYPE
, lwtstate
->type
);
253 goto nla_put_failure
;
258 nla_nest_cancel(skb
, nest
);
260 return (ret
== -EOPNOTSUPP
? 0 : ret
);
262 EXPORT_SYMBOL(lwtunnel_fill_encap
);
/*
 * lwtunnel_get_encap_size - netlink space needed for the encap of a state
 * @lwtstate: state to size; lwtstate->type selects the ops slot
 *
 * Types LWTUNNEL_ENCAP_NONE and above LWTUNNEL_ENCAP_MAX take an early
 * exit. Otherwise the ops pointer is read with rcu_dereference() and, when
 * ops->get_encap_size is set, ret becomes nla_total_size() of the value
 * that hook reports for @lwtstate.
 *
 * NOTE(review): the initial value of ret, the value returned on the early
 * exit, the RCU read-side lock calls and the final return are absent from
 * this copy - TODO confirm what is returned when no hook is registered.
 */
264 int lwtunnel_get_encap_size(struct lwtunnel_state
*lwtstate
)
266 const struct lwtunnel_encap_ops
*ops
;
272 if (lwtstate
->type
== LWTUNNEL_ENCAP_NONE
||
273 lwtstate
->type
> LWTUNNEL_ENCAP_MAX
)
277 ops
= rcu_dereference(lwtun_encaps
[lwtstate
->type
]);
278 if (likely(ops
&& ops
->get_encap_size
))
279 ret
= nla_total_size(ops
->get_encap_size(lwtstate
));
284 EXPORT_SYMBOL(lwtunnel_get_encap_size
);
/*
 * lwtunnel_cmp_encap - compare two tunnel states
 * @a: first state
 * @b: second state
 *
 * Steps visible in this copy:
 *  - Differing a->type and b->type take an early exit.
 *  - A type of LWTUNNEL_ENCAP_NONE or above LWTUNNEL_ENCAP_MAX takes an
 *    early exit.
 *  - The ops pointer for a->type is read with rcu_dereference() and
 *    ops->cmp_encap(a, b) supplies ret when that hook is set.
 *
 * NOTE(review): the statements between the declaration and the type
 * comparison (presumably NULL handling for a and b), the values returned
 * on each early exit, the initial value of ret and the final return are
 * absent from this copy - TODO confirm the return convention.
 */
286 int lwtunnel_cmp_encap(struct lwtunnel_state
*a
, struct lwtunnel_state
*b
)
288 const struct lwtunnel_encap_ops
*ops
;
297 if (a
->type
!= b
->type
)
300 if (a
->type
== LWTUNNEL_ENCAP_NONE
||
301 a
->type
> LWTUNNEL_ENCAP_MAX
)
305 ops
= rcu_dereference(lwtun_encaps
[a
->type
]);
306 if (likely(ops
&& ops
->cmp_encap
))
307 ret
= ops
->cmp_encap(a
, b
);
312 EXPORT_SYMBOL(lwtunnel_cmp_encap
);
/*
 * lwtunnel_output - hand a packet to the output hook of its tunnel state
 * @net: passed through unchanged to the hook
 * @sk: passed through unchanged to the hook
 * @skb: packet; its dst entry (skb_dst()) carries the tunnel state
 *
 * Takes lwtstate from dst->lwtstate. Types LWTUNNEL_ENCAP_NONE and above
 * LWTUNNEL_ENCAP_MAX take an early exit. Otherwise the ops pointer is read
 * with rcu_dereference() and ops->output(net, sk, skb) supplies ret when
 * that hook is set. A result of -EOPNOTSUPP is singled out afterwards.
 *
 * NOTE(review): the statements between the declarations and the lwtstate
 * read (presumably a check that dst is set), the value returned on the
 * early exit, the initial value of ret, the action taken for -EOPNOTSUPP
 * and the final return are absent from this copy - TODO confirm, in
 * particular who frees skb on the error paths.
 */
314 int lwtunnel_output(struct net
*net
, struct sock
*sk
, struct sk_buff
*skb
)
316 struct dst_entry
*dst
= skb_dst(skb
);
317 const struct lwtunnel_encap_ops
*ops
;
318 struct lwtunnel_state
*lwtstate
;
323 lwtstate
= dst
->lwtstate
;
325 if (lwtstate
->type
== LWTUNNEL_ENCAP_NONE
||
326 lwtstate
->type
> LWTUNNEL_ENCAP_MAX
)
331 ops
= rcu_dereference(lwtun_encaps
[lwtstate
->type
]);
332 if (likely(ops
&& ops
->output
))
333 ret
= ops
->output(net
, sk
, skb
);
336 if (ret
== -EOPNOTSUPP
)
346 EXPORT_SYMBOL(lwtunnel_output
);
/*
 * lwtunnel_xmit - hand a packet to the xmit hook of its tunnel state
 * @skb: packet; its dst entry (skb_dst()) carries the tunnel state
 *
 * Takes lwtstate from dst->lwtstate. Types LWTUNNEL_ENCAP_NONE and above
 * LWTUNNEL_ENCAP_MAX take an early exit. Otherwise the ops pointer is read
 * with rcu_dereference() and ops->xmit(skb) supplies ret when that hook is
 * set. A result of -EOPNOTSUPP is singled out afterwards.
 *
 * NOTE(review): the statements between the declarations and the lwtstate
 * read (presumably a check that dst is set), the value returned on the
 * early exit, the initial value of ret, the action taken for -EOPNOTSUPP
 * and the final return are absent from this copy - TODO confirm, in
 * particular who frees skb on the error paths.
 */
348 int lwtunnel_xmit(struct sk_buff
*skb
)
350 struct dst_entry
*dst
= skb_dst(skb
);
351 const struct lwtunnel_encap_ops
*ops
;
352 struct lwtunnel_state
*lwtstate
;
358 lwtstate
= dst
->lwtstate
;
360 if (lwtstate
->type
== LWTUNNEL_ENCAP_NONE
||
361 lwtstate
->type
> LWTUNNEL_ENCAP_MAX
)
366 ops
= rcu_dereference(lwtun_encaps
[lwtstate
->type
]);
367 if (likely(ops
&& ops
->xmit
))
368 ret
= ops
->xmit(skb
);
371 if (ret
== -EOPNOTSUPP
)
381 EXPORT_SYMBOL(lwtunnel_xmit
);
/*
 * lwtunnel_input - hand a packet to the input hook of its tunnel state
 * @skb: packet; its dst entry (skb_dst()) carries the tunnel state
 *
 * Takes lwtstate from dst->lwtstate. Types LWTUNNEL_ENCAP_NONE and above
 * LWTUNNEL_ENCAP_MAX take an early exit. Otherwise the ops pointer is read
 * with rcu_dereference() and ops->input(skb) supplies ret when that hook
 * is set. A result of -EOPNOTSUPP is singled out afterwards.
 *
 * NOTE(review): the statements between the declarations and the lwtstate
 * read (presumably a check that dst is set), the value returned on the
 * early exit, the initial value of ret, the action taken for -EOPNOTSUPP
 * and the final return are absent from this copy - TODO confirm, in
 * particular who frees skb on the error paths.
 */
383 int lwtunnel_input(struct sk_buff
*skb
)
385 struct dst_entry
*dst
= skb_dst(skb
);
386 const struct lwtunnel_encap_ops
*ops
;
387 struct lwtunnel_state
*lwtstate
;
392 lwtstate
= dst
->lwtstate
;
394 if (lwtstate
->type
== LWTUNNEL_ENCAP_NONE
||
395 lwtstate
->type
> LWTUNNEL_ENCAP_MAX
)
400 ops
= rcu_dereference(lwtun_encaps
[lwtstate
->type
]);
401 if (likely(ops
&& ops
->input
))
402 ret
= ops
->input(skb
);
405 if (ret
== -EOPNOTSUPP
)
415 EXPORT_SYMBOL(lwtunnel_input
);