1 // SPDX-License-Identifier: GPL-2.0-or-later
3 * lwtunnel Infrastructure for light weight tunnels like mpls
5 * Authors: Roopa Prabhu, <roopa@cumulusnetworks.com>
8 #include <linux/capability.h>
9 #include <linux/module.h>
10 #include <linux/types.h>
11 #include <linux/kernel.h>
12 #include <linux/slab.h>
13 #include <linux/uaccess.h>
14 #include <linux/skbuff.h>
15 #include <linux/netdevice.h>
16 #include <linux/lwtunnel.h>
18 #include <linux/init.h>
19 #include <linux/err.h>
21 #include <net/lwtunnel.h>
22 #include <net/rtnetlink.h>
23 #include <net/ip6_fib.h>
28 static const char *lwtunnel_encap_str(enum lwtunnel_encap_types encap_type
)
30 /* Only lwt encaps implemented without using an interface for
31 * the encap need to return a string here.
34 case LWTUNNEL_ENCAP_MPLS
:
36 case LWTUNNEL_ENCAP_ILA
:
38 case LWTUNNEL_ENCAP_SEG6
:
40 case LWTUNNEL_ENCAP_BPF
:
42 case LWTUNNEL_ENCAP_SEG6_LOCAL
:
44 case LWTUNNEL_ENCAP_RPL
:
46 case LWTUNNEL_ENCAP_IP6
:
47 case LWTUNNEL_ENCAP_IP
:
48 case LWTUNNEL_ENCAP_NONE
:
49 case __LWTUNNEL_ENCAP_MAX
:
50 /* should not have got here */
57 #endif /* CONFIG_MODULES */
59 struct lwtunnel_state
*lwtunnel_state_alloc(int encap_len
)
61 struct lwtunnel_state
*lws
;
63 lws
= kzalloc(sizeof(*lws
) + encap_len
, GFP_ATOMIC
);
67 EXPORT_SYMBOL_GPL(lwtunnel_state_alloc
);
69 static const struct lwtunnel_encap_ops __rcu
*
70 lwtun_encaps
[LWTUNNEL_ENCAP_MAX
+ 1] __read_mostly
;
72 int lwtunnel_encap_add_ops(const struct lwtunnel_encap_ops
*ops
,
75 if (num
> LWTUNNEL_ENCAP_MAX
)
78 return !cmpxchg((const struct lwtunnel_encap_ops
**)
82 EXPORT_SYMBOL_GPL(lwtunnel_encap_add_ops
);
84 int lwtunnel_encap_del_ops(const struct lwtunnel_encap_ops
*ops
,
85 unsigned int encap_type
)
89 if (encap_type
== LWTUNNEL_ENCAP_NONE
||
90 encap_type
> LWTUNNEL_ENCAP_MAX
)
93 ret
= (cmpxchg((const struct lwtunnel_encap_ops
**)
94 &lwtun_encaps
[encap_type
],
95 ops
, NULL
) == ops
) ? 0 : -1;
101 EXPORT_SYMBOL_GPL(lwtunnel_encap_del_ops
);
103 int lwtunnel_build_state(struct net
*net
, u16 encap_type
,
104 struct nlattr
*encap
, unsigned int family
,
105 const void *cfg
, struct lwtunnel_state
**lws
,
106 struct netlink_ext_ack
*extack
)
108 const struct lwtunnel_encap_ops
*ops
;
112 if (encap_type
== LWTUNNEL_ENCAP_NONE
||
113 encap_type
> LWTUNNEL_ENCAP_MAX
) {
114 NL_SET_ERR_MSG_ATTR(extack
, encap
,
115 "Unknown LWT encapsulation type");
121 ops
= rcu_dereference(lwtun_encaps
[encap_type
]);
122 if (likely(ops
&& ops
->build_state
&& try_module_get(ops
->owner
)))
127 ret
= ops
->build_state(net
, encap
, family
, cfg
, lws
, extack
);
129 module_put(ops
->owner
);
131 /* don't rely on -EOPNOTSUPP to detect match as build_state
132 * handlers could return it
134 NL_SET_ERR_MSG_ATTR(extack
, encap
,
135 "LWT encapsulation type not supported");
140 EXPORT_SYMBOL_GPL(lwtunnel_build_state
);
142 int lwtunnel_valid_encap_type(u16 encap_type
, struct netlink_ext_ack
*extack
)
144 const struct lwtunnel_encap_ops
*ops
;
147 if (encap_type
== LWTUNNEL_ENCAP_NONE
||
148 encap_type
> LWTUNNEL_ENCAP_MAX
) {
149 NL_SET_ERR_MSG(extack
, "Unknown lwt encapsulation type");
154 ops
= rcu_dereference(lwtun_encaps
[encap_type
]);
156 #ifdef CONFIG_MODULES
158 const char *encap_type_str
= lwtunnel_encap_str(encap_type
);
160 if (encap_type_str
) {
162 request_module("rtnl-lwt-%s", encap_type_str
);
166 ops
= rcu_dereference(lwtun_encaps
[encap_type
]);
171 ret
= ops
? 0 : -EOPNOTSUPP
;
173 NL_SET_ERR_MSG(extack
, "lwt encapsulation type not supported");
177 EXPORT_SYMBOL_GPL(lwtunnel_valid_encap_type
);
179 int lwtunnel_valid_encap_type_attr(struct nlattr
*attr
, int remaining
,
180 struct netlink_ext_ack
*extack
)
182 struct rtnexthop
*rtnh
= (struct rtnexthop
*)attr
;
183 struct nlattr
*nla_entype
;
184 struct nlattr
*attrs
;
188 while (rtnh_ok(rtnh
, remaining
)) {
189 attrlen
= rtnh_attrlen(rtnh
);
191 attrs
= rtnh_attrs(rtnh
);
192 nla_entype
= nla_find(attrs
, attrlen
, RTA_ENCAP_TYPE
);
195 encap_type
= nla_get_u16(nla_entype
);
197 if (lwtunnel_valid_encap_type(encap_type
,
202 rtnh
= rtnh_next(rtnh
, &remaining
);
207 EXPORT_SYMBOL_GPL(lwtunnel_valid_encap_type_attr
);
209 void lwtstate_free(struct lwtunnel_state
*lws
)
211 const struct lwtunnel_encap_ops
*ops
= lwtun_encaps
[lws
->type
];
213 if (ops
->destroy_state
) {
214 ops
->destroy_state(lws
);
219 module_put(ops
->owner
);
221 EXPORT_SYMBOL_GPL(lwtstate_free
);
223 int lwtunnel_fill_encap(struct sk_buff
*skb
, struct lwtunnel_state
*lwtstate
,
224 int encap_attr
, int encap_type_attr
)
226 const struct lwtunnel_encap_ops
*ops
;
233 if (lwtstate
->type
== LWTUNNEL_ENCAP_NONE
||
234 lwtstate
->type
> LWTUNNEL_ENCAP_MAX
)
237 nest
= nla_nest_start_noflag(skb
, encap_attr
);
243 ops
= rcu_dereference(lwtun_encaps
[lwtstate
->type
]);
244 if (likely(ops
&& ops
->fill_encap
))
245 ret
= ops
->fill_encap(skb
, lwtstate
);
249 goto nla_put_failure
;
250 nla_nest_end(skb
, nest
);
251 ret
= nla_put_u16(skb
, encap_type_attr
, lwtstate
->type
);
253 goto nla_put_failure
;
258 nla_nest_cancel(skb
, nest
);
260 return (ret
== -EOPNOTSUPP
? 0 : ret
);
262 EXPORT_SYMBOL_GPL(lwtunnel_fill_encap
);
264 int lwtunnel_get_encap_size(struct lwtunnel_state
*lwtstate
)
266 const struct lwtunnel_encap_ops
*ops
;
272 if (lwtstate
->type
== LWTUNNEL_ENCAP_NONE
||
273 lwtstate
->type
> LWTUNNEL_ENCAP_MAX
)
277 ops
= rcu_dereference(lwtun_encaps
[lwtstate
->type
]);
278 if (likely(ops
&& ops
->get_encap_size
))
279 ret
= nla_total_size(ops
->get_encap_size(lwtstate
));
284 EXPORT_SYMBOL_GPL(lwtunnel_get_encap_size
);
286 int lwtunnel_cmp_encap(struct lwtunnel_state
*a
, struct lwtunnel_state
*b
)
288 const struct lwtunnel_encap_ops
*ops
;
297 if (a
->type
!= b
->type
)
300 if (a
->type
== LWTUNNEL_ENCAP_NONE
||
301 a
->type
> LWTUNNEL_ENCAP_MAX
)
305 ops
= rcu_dereference(lwtun_encaps
[a
->type
]);
306 if (likely(ops
&& ops
->cmp_encap
))
307 ret
= ops
->cmp_encap(a
, b
);
312 EXPORT_SYMBOL_GPL(lwtunnel_cmp_encap
);
314 int lwtunnel_output(struct net
*net
, struct sock
*sk
, struct sk_buff
*skb
)
316 struct dst_entry
*dst
= skb_dst(skb
);
317 const struct lwtunnel_encap_ops
*ops
;
318 struct lwtunnel_state
*lwtstate
;
323 lwtstate
= dst
->lwtstate
;
325 if (lwtstate
->type
== LWTUNNEL_ENCAP_NONE
||
326 lwtstate
->type
> LWTUNNEL_ENCAP_MAX
)
331 ops
= rcu_dereference(lwtun_encaps
[lwtstate
->type
]);
332 if (likely(ops
&& ops
->output
))
333 ret
= ops
->output(net
, sk
, skb
);
336 if (ret
== -EOPNOTSUPP
)
346 EXPORT_SYMBOL_GPL(lwtunnel_output
);
348 int lwtunnel_xmit(struct sk_buff
*skb
)
350 struct dst_entry
*dst
= skb_dst(skb
);
351 const struct lwtunnel_encap_ops
*ops
;
352 struct lwtunnel_state
*lwtstate
;
358 lwtstate
= dst
->lwtstate
;
360 if (lwtstate
->type
== LWTUNNEL_ENCAP_NONE
||
361 lwtstate
->type
> LWTUNNEL_ENCAP_MAX
)
366 ops
= rcu_dereference(lwtun_encaps
[lwtstate
->type
]);
367 if (likely(ops
&& ops
->xmit
))
368 ret
= ops
->xmit(skb
);
371 if (ret
== -EOPNOTSUPP
)
381 EXPORT_SYMBOL_GPL(lwtunnel_xmit
);
383 int lwtunnel_input(struct sk_buff
*skb
)
385 struct dst_entry
*dst
= skb_dst(skb
);
386 const struct lwtunnel_encap_ops
*ops
;
387 struct lwtunnel_state
*lwtstate
;
392 lwtstate
= dst
->lwtstate
;
394 if (lwtstate
->type
== LWTUNNEL_ENCAP_NONE
||
395 lwtstate
->type
> LWTUNNEL_ENCAP_MAX
)
400 ops
= rcu_dereference(lwtun_encaps
[lwtstate
->type
]);
401 if (likely(ops
&& ops
->input
))
402 ret
= ops
->input(skb
);
405 if (ret
== -EOPNOTSUPP
)
415 EXPORT_SYMBOL_GPL(lwtunnel_input
);