2 * xfrm6_policy.c: based on xfrm4_policy.c
6 * Kazunori MIYAZAWA @USAGI
7 * Kunihiro Ishiguro <kunihiro@ipinfusion.com>
10 * Split up af-specific portion
14 #include <linux/err.h>
15 #include <linux/kernel.h>
16 #include <linux/netdevice.h>
17 #include <net/addrconf.h>
22 #include <net/ip6_route.h>
23 #include <net/l3mdev.h>
24 #if IS_ENABLED(CONFIG_IPV6_MIP6)
28 static struct xfrm_policy_afinfo xfrm6_policy_afinfo
;
30 static struct dst_entry
*xfrm6_dst_lookup(struct net
*net
, int tos
, int oif
,
31 const xfrm_address_t
*saddr
,
32 const xfrm_address_t
*daddr
)
35 struct dst_entry
*dst
;
38 memset(&fl6
, 0, sizeof(fl6
));
39 fl6
.flowi6_oif
= l3mdev_master_ifindex_by_index(net
, oif
);
40 fl6
.flowi6_flags
= FLOWI_FLAG_SKIP_NH_OIF
;
41 memcpy(&fl6
.daddr
, daddr
, sizeof(fl6
.daddr
));
43 memcpy(&fl6
.saddr
, saddr
, sizeof(fl6
.saddr
));
45 dst
= ip6_route_output(net
, NULL
, &fl6
);
56 static int xfrm6_get_saddr(struct net
*net
, int oif
,
57 xfrm_address_t
*saddr
, xfrm_address_t
*daddr
)
59 struct dst_entry
*dst
;
60 struct net_device
*dev
;
62 dst
= xfrm6_dst_lookup(net
, 0, oif
, NULL
, daddr
);
66 dev
= ip6_dst_idev(dst
)->dev
;
67 ipv6_dev_get_saddr(dev_net(dev
), dev
, &daddr
->in6
, 0, &saddr
->in6
);
72 static int xfrm6_get_tos(const struct flowi
*fl
)
77 static int xfrm6_init_path(struct xfrm_dst
*path
, struct dst_entry
*dst
,
80 if (dst
->ops
->family
== AF_INET6
) {
81 struct rt6_info
*rt
= (struct rt6_info
*)dst
;
82 path
->path_cookie
= rt6_get_cookie(rt
);
85 path
->u
.rt6
.rt6i_nfheader_len
= nfheader_len
;
90 static int xfrm6_fill_dst(struct xfrm_dst
*xdst
, struct net_device
*dev
,
91 const struct flowi
*fl
)
93 struct rt6_info
*rt
= (struct rt6_info
*)xdst
->route
;
95 xdst
->u
.dst
.dev
= dev
;
98 xdst
->u
.rt6
.rt6i_idev
= in6_dev_get(dev
);
99 if (!xdst
->u
.rt6
.rt6i_idev
) {
104 /* Sheit... I remember I did this right. Apparently,
105 * it was magically lost, so this code needs audit */
106 xdst
->u
.rt6
.rt6i_flags
= rt
->rt6i_flags
& (RTF_ANYCAST
|
108 xdst
->u
.rt6
.rt6i_metric
= rt
->rt6i_metric
;
109 xdst
->u
.rt6
.rt6i_node
= rt
->rt6i_node
;
110 xdst
->route_cookie
= rt6_get_cookie(rt
);
111 xdst
->u
.rt6
.rt6i_gateway
= rt
->rt6i_gateway
;
112 xdst
->u
.rt6
.rt6i_dst
= rt
->rt6i_dst
;
113 xdst
->u
.rt6
.rt6i_src
= rt
->rt6i_src
;
119 _decode_session6(struct sk_buff
*skb
, struct flowi
*fl
, int reverse
)
121 struct flowi6
*fl6
= &fl
->u
.ip6
;
123 const struct ipv6hdr
*hdr
= ipv6_hdr(skb
);
124 u16 offset
= sizeof(*hdr
);
125 struct ipv6_opt_hdr
*exthdr
;
126 const unsigned char *nh
= skb_network_header(skb
);
127 u16 nhoff
= IP6CB(skb
)->nhoff
;
132 nhoff
= offsetof(struct ipv6hdr
, nexthdr
);
137 oif
= l3mdev_fib_oif(skb_dst(skb
)->dev
);
139 memset(fl6
, 0, sizeof(struct flowi6
));
140 fl6
->flowi6_mark
= skb
->mark
;
141 fl6
->flowi6_oif
= reverse
? skb
->skb_iif
: oif
;
143 fl6
->daddr
= reverse
? hdr
->saddr
: hdr
->daddr
;
144 fl6
->saddr
= reverse
? hdr
->daddr
: hdr
->saddr
;
146 while (nh
+ offset
+ 1 < skb
->data
||
147 pskb_may_pull(skb
, nh
+ offset
+ 1 - skb
->data
)) {
148 nh
= skb_network_header(skb
);
149 exthdr
= (struct ipv6_opt_hdr
*)(nh
+ offset
);
152 case NEXTHDR_FRAGMENT
:
154 case NEXTHDR_ROUTING
:
157 offset
+= ipv6_optlen(exthdr
);
158 nexthdr
= exthdr
->nexthdr
;
159 exthdr
= (struct ipv6_opt_hdr
*)(nh
+ offset
);
163 case IPPROTO_UDPLITE
:
167 if (!onlyproto
&& (nh
+ offset
+ 4 < skb
->data
||
168 pskb_may_pull(skb
, nh
+ offset
+ 4 - skb
->data
))) {
171 nh
= skb_network_header(skb
);
172 ports
= (__be16
*)(nh
+ offset
);
173 fl6
->fl6_sport
= ports
[!!reverse
];
174 fl6
->fl6_dport
= ports
[!reverse
];
176 fl6
->flowi6_proto
= nexthdr
;
180 if (!onlyproto
&& (nh
+ offset
+ 2 < skb
->data
||
181 pskb_may_pull(skb
, nh
+ offset
+ 2 - skb
->data
))) {
184 nh
= skb_network_header(skb
);
185 icmp
= (u8
*)(nh
+ offset
);
186 fl6
->fl6_icmp_type
= icmp
[0];
187 fl6
->fl6_icmp_code
= icmp
[1];
189 fl6
->flowi6_proto
= nexthdr
;
192 #if IS_ENABLED(CONFIG_IPV6_MIP6)
194 offset
+= ipv6_optlen(exthdr
);
195 if (!onlyproto
&& (nh
+ offset
+ 3 < skb
->data
||
196 pskb_may_pull(skb
, nh
+ offset
+ 3 - skb
->data
))) {
199 nh
= skb_network_header(skb
);
200 mh
= (struct ip6_mh
*)(nh
+ offset
);
201 fl6
->fl6_mh_type
= mh
->ip6mh_type
;
203 fl6
->flowi6_proto
= nexthdr
;
207 /* XXX Why are there these headers? */
212 fl6
->fl6_ipsec_spi
= 0;
213 fl6
->flowi6_proto
= nexthdr
;
219 static inline int xfrm6_garbage_collect(struct dst_ops
*ops
)
221 struct net
*net
= container_of(ops
, struct net
, xfrm
.xfrm6_dst_ops
);
223 xfrm6_policy_afinfo
.garbage_collect(net
);
224 return dst_entries_get_fast(ops
) > ops
->gc_thresh
* 2;
227 static void xfrm6_update_pmtu(struct dst_entry
*dst
, struct sock
*sk
,
228 struct sk_buff
*skb
, u32 mtu
)
230 struct xfrm_dst
*xdst
= (struct xfrm_dst
*)dst
;
231 struct dst_entry
*path
= xdst
->route
;
233 path
->ops
->update_pmtu(path
, sk
, skb
, mtu
);
236 static void xfrm6_redirect(struct dst_entry
*dst
, struct sock
*sk
,
239 struct xfrm_dst
*xdst
= (struct xfrm_dst
*)dst
;
240 struct dst_entry
*path
= xdst
->route
;
242 path
->ops
->redirect(path
, sk
, skb
);
245 static void xfrm6_dst_destroy(struct dst_entry
*dst
)
247 struct xfrm_dst
*xdst
= (struct xfrm_dst
*)dst
;
249 if (likely(xdst
->u
.rt6
.rt6i_idev
))
250 in6_dev_put(xdst
->u
.rt6
.rt6i_idev
);
251 dst_destroy_metrics_generic(dst
);
252 xfrm_dst_destroy(xdst
);
255 static void xfrm6_dst_ifdown(struct dst_entry
*dst
, struct net_device
*dev
,
258 struct xfrm_dst
*xdst
;
263 xdst
= (struct xfrm_dst
*)dst
;
264 if (xdst
->u
.rt6
.rt6i_idev
->dev
== dev
) {
265 struct inet6_dev
*loopback_idev
=
266 in6_dev_get(dev_net(dev
)->loopback_dev
);
267 BUG_ON(!loopback_idev
);
270 in6_dev_put(xdst
->u
.rt6
.rt6i_idev
);
271 xdst
->u
.rt6
.rt6i_idev
= loopback_idev
;
272 in6_dev_hold(loopback_idev
);
273 xdst
= (struct xfrm_dst
*)xdst
->u
.dst
.child
;
274 } while (xdst
->u
.dst
.xfrm
);
276 __in6_dev_put(loopback_idev
);
279 xfrm_dst_ifdown(dst
, dev
);
282 static struct dst_ops xfrm6_dst_ops_template
= {
284 .gc
= xfrm6_garbage_collect
,
285 .update_pmtu
= xfrm6_update_pmtu
,
286 .redirect
= xfrm6_redirect
,
287 .cow_metrics
= dst_cow_metrics_generic
,
288 .destroy
= xfrm6_dst_destroy
,
289 .ifdown
= xfrm6_dst_ifdown
,
290 .local_out
= __ip6_local_out
,
291 .gc_thresh
= INT_MAX
,
294 static struct xfrm_policy_afinfo xfrm6_policy_afinfo
= {
296 .dst_ops
= &xfrm6_dst_ops_template
,
297 .dst_lookup
= xfrm6_dst_lookup
,
298 .get_saddr
= xfrm6_get_saddr
,
299 .decode_session
= _decode_session6
,
300 .get_tos
= xfrm6_get_tos
,
301 .init_path
= xfrm6_init_path
,
302 .fill_dst
= xfrm6_fill_dst
,
303 .blackhole_route
= ip6_blackhole_route
,
306 static int __init
xfrm6_policy_init(void)
308 return xfrm_policy_register_afinfo(&xfrm6_policy_afinfo
);
311 static void xfrm6_policy_fini(void)
313 xfrm_policy_unregister_afinfo(&xfrm6_policy_afinfo
);
317 static struct ctl_table xfrm6_policy_table
[] = {
319 .procname
= "xfrm6_gc_thresh",
320 .data
= &init_net
.xfrm
.xfrm6_dst_ops
.gc_thresh
,
321 .maxlen
= sizeof(int),
323 .proc_handler
= proc_dointvec
,
328 static int __net_init
xfrm6_net_sysctl_init(struct net
*net
)
330 struct ctl_table
*table
;
331 struct ctl_table_header
*hdr
;
333 table
= xfrm6_policy_table
;
334 if (!net_eq(net
, &init_net
)) {
335 table
= kmemdup(table
, sizeof(xfrm6_policy_table
), GFP_KERNEL
);
339 table
[0].data
= &net
->xfrm
.xfrm6_dst_ops
.gc_thresh
;
342 hdr
= register_net_sysctl(net
, "net/ipv6", table
);
346 net
->ipv6
.sysctl
.xfrm6_hdr
= hdr
;
350 if (!net_eq(net
, &init_net
))
356 static void __net_exit
xfrm6_net_sysctl_exit(struct net
*net
)
358 struct ctl_table
*table
;
360 if (!net
->ipv6
.sysctl
.xfrm6_hdr
)
363 table
= net
->ipv6
.sysctl
.xfrm6_hdr
->ctl_table_arg
;
364 unregister_net_sysctl_table(net
->ipv6
.sysctl
.xfrm6_hdr
);
365 if (!net_eq(net
, &init_net
))
368 #else /* CONFIG_SYSCTL */
369 static inline int xfrm6_net_sysctl_init(struct net
*net
)
374 static inline void xfrm6_net_sysctl_exit(struct net
*net
)
379 static int __net_init
xfrm6_net_init(struct net
*net
)
383 memcpy(&net
->xfrm
.xfrm6_dst_ops
, &xfrm6_dst_ops_template
,
384 sizeof(xfrm6_dst_ops_template
));
385 ret
= dst_entries_init(&net
->xfrm
.xfrm6_dst_ops
);
389 ret
= xfrm6_net_sysctl_init(net
);
391 dst_entries_destroy(&net
->xfrm
.xfrm6_dst_ops
);
396 static void __net_exit
xfrm6_net_exit(struct net
*net
)
398 xfrm6_net_sysctl_exit(net
);
399 dst_entries_destroy(&net
->xfrm
.xfrm6_dst_ops
);
402 static struct pernet_operations xfrm6_net_ops
= {
403 .init
= xfrm6_net_init
,
404 .exit
= xfrm6_net_exit
,
407 int __init
xfrm6_init(void)
411 ret
= xfrm6_policy_init();
414 ret
= xfrm6_state_init();
418 ret
= xfrm6_protocol_init();
422 register_pernet_subsys(&xfrm6_net_ops
);
432 void xfrm6_fini(void)
434 unregister_pernet_subsys(&xfrm6_net_ops
);
435 xfrm6_protocol_fini();