1 // SPDX-License-Identifier: GPL-2.0-only
7 * Kazunori MIYAZAWA @USAGI
8 * Kunihiro Ishiguro <kunihiro@ipinfusion.com>
10 * YOSHIFUJI Hideaki @USAGI
11 * Split up af-specific functions
12 * Derek Atkins <derek@ihtfp.com>
13 * Add UDP Encapsulation
17 #include <linux/workqueue.h>
19 #include <linux/pfkeyv2.h>
20 #include <linux/ipsec.h>
21 #include <linux/module.h>
22 #include <linux/cache.h>
23 #include <linux/audit.h>
24 #include <linux/uaccess.h>
25 #include <linux/ktime.h>
26 #include <linux/slab.h>
27 #include <linux/interrupt.h>
28 #include <linux/kernel.h>
30 #include <crypto/aead.h>
32 #include "xfrm_hash.h"
/*
 * Update-side dereference of an RCU-managed state hash table pointer.
 * The lockdep expression documents that the caller must hold
 * (net)->xfrm.xfrm_state_lock.
 */
34 #define xfrm_state_deref_prot(table, net) \
35 rcu_dereference_protected((table), lockdep_is_held(&(net)->xfrm.xfrm_state_lock))
/*
 * Forward declaration of the garbage-collection work handler; it is
 * referenced by the DECLARE_WORK() further down and defined later in
 * this file.
 */
37 static void xfrm_state_gc_task(struct work_struct
*work
);
39 /* Each xfrm_state may be linked to three tables:
41 1. Hash table by (spi,daddr,ah/esp) to find SA by SPI. (input,ctl)
42 2. Hash table by (daddr,family,reqid) to find what SAs exist for given
43 destination/tunnel endpoint. (output)
3. Hash table by (daddr,saddr,family) to find SAs by address pair.
*/
/*
 * Upper bound on the number of hash buckets; xfrm_hash_grow_check()
 * only schedules a resize while (state_hmask + 1) is below this value.
 */
46 static unsigned int xfrm_state_hashmax __read_mostly
= 1 * 1024 * 1024;
/*
 * Sequence counter written around the table swap in xfrm_hash_resize()
 * and sampled/rechecked by xfrm_state_find().
 */
47 static __read_mostly seqcount_t xfrm_state_hash_generation
= SEQCNT_ZERO(xfrm_state_hash_generation
);
/* Slab cache used by xfrm_state_alloc() and xfrm_state_free(). */
48 static struct kmem_cache
*xfrm_state_cache __ro_after_init
;
/*
 * Deferred destruction: __xfrm_state_destroy() queues states on
 * xfrm_state_gc_list and schedules xfrm_state_gc_work, whose handler
 * xfrm_state_gc_task() tears them down.
 */
50 static DECLARE_WORK(xfrm_state_gc_work
, xfrm_state_gc_task
);
51 static HLIST_HEAD(xfrm_state_gc_list
);
/*
 * Try to take a reference on a state found during a lockless walk.
 * Returns the result of refcount_inc_not_zero() on x->refcnt, so callers
 * must treat a false return as "state is going away, do not use it".
 */
53 static inline bool xfrm_state_hold_rcu(struct xfrm_state __rcu
*x
)
55 return refcount_inc_not_zero(&x
->refcnt
);
/*
 * Bucket index into this netns' by-destination table: forwards to
 * __xfrm_dst_hash() using net->xfrm.state_hmask as the mask.
 * NOTE(review): reqid is passed through below, but its parameter
 * declaration is not visible in this view.
 */
58 static inline unsigned int xfrm_dst_hash(struct net
*net
,
59 const xfrm_address_t
*daddr
,
60 const xfrm_address_t
*saddr
,
62 unsigned short family
)
64 return __xfrm_dst_hash(daddr
, saddr
, reqid
, family
, net
->xfrm
.state_hmask
);
/*
 * Bucket index into this netns' by-source table: forwards to
 * __xfrm_src_hash() using net->xfrm.state_hmask as the mask.
 */
67 static inline unsigned int xfrm_src_hash(struct net
*net
,
68 const xfrm_address_t
*daddr
,
69 const xfrm_address_t
*saddr
,
70 unsigned short family
)
72 return __xfrm_src_hash(daddr
, saddr
, family
, net
->xfrm
.state_hmask
);
/*
 * Bucket index into this netns' by-SPI table: forwards to
 * __xfrm_spi_hash() using net->xfrm.state_hmask as the mask.
 */
75 static inline unsigned int
76 xfrm_spi_hash(struct net
*net
, const xfrm_address_t
*daddr
,
77 __be32 spi
, u8 proto
, unsigned short family
)
79 return __xfrm_spi_hash(daddr
, spi
, proto
, family
, net
->xfrm
.state_hmask
);
/*
 * Move every state on one old bucket chain (walked through the bydst
 * linkage, using the _safe iterator because entries are re-linked while
 * walking) into the new dst, src and spi tables.  Each state is re-hashed
 * with __xfrm_dst_hash(), __xfrm_src_hash() and __xfrm_spi_hash() and
 * added at the head of the resulting bucket with hlist_add_head_rcu().
 * NOTE(review): the final (mask) argument of the three hash calls and any
 * condition around the byspi insertion are not visible in this view;
 * presumably nhashmask is the mask -- confirm.
 */
82 static void xfrm_hash_transfer(struct hlist_head
*list
,
83 struct hlist_head
*ndsttable
,
84 struct hlist_head
*nsrctable
,
85 struct hlist_head
*nspitable
,
86 unsigned int nhashmask
)
88 struct hlist_node
*tmp
;
91 hlist_for_each_entry_safe(x
, tmp
, list
, bydst
) {
94 h
= __xfrm_dst_hash(&x
->id
.daddr
, &x
->props
.saddr
,
95 x
->props
.reqid
, x
->props
.family
,
97 hlist_add_head_rcu(&x
->bydst
, ndsttable
+ h
);
99 h
= __xfrm_src_hash(&x
->id
.daddr
, &x
->props
.saddr
,
102 hlist_add_head_rcu(&x
->bysrc
, nsrctable
+ h
);
105 h
= __xfrm_spi_hash(&x
->id
.daddr
, x
->id
.spi
,
106 x
->id
.proto
, x
->props
.family
,
108 hlist_add_head_rcu(&x
->byspi
, nspitable
+ h
);
/*
 * Size in bytes of a table with twice as many buckets as the given mask
 * describes: (state_hmask + 1) buckets doubled, times sizeof(struct
 * hlist_head).
 */
113 static unsigned long xfrm_hash_new_size(unsigned int state_hmask
)
115 return ((state_hmask
+ 1) << 1) * sizeof(struct hlist_head
);
/*
 * Work handler (net->xfrm.state_hash_work) that grows the per-netns state
 * hash tables.
 *
 * Three new tables of xfrm_hash_new_size() bytes are allocated first.
 * Then, with xfrm_state_lock held and inside a write section of
 * xfrm_state_hash_generation, every old bydst bucket is handed to
 * xfrm_hash_transfer(), the three table pointers are published with
 * rcu_assign_pointer() and state_hmask is updated.  The old tables are
 * freed after the lock is released.
 *
 * NOTE(review): the allocation-failure checks and whatever separates the
 * unlock from the frees of the old tables are not visible in this view;
 * an RCU grace-period wait would be expected before those frees --
 * confirm against the full source.
 */
118 static void xfrm_hash_resize(struct work_struct
*work
)
120 struct net
*net
= container_of(work
, struct net
, xfrm
.state_hash_work
);
121 struct hlist_head
*ndst
, *nsrc
, *nspi
, *odst
, *osrc
, *ospi
;
122 unsigned long nsize
, osize
;
123 unsigned int nhashmask
, ohashmask
;
126 nsize
= xfrm_hash_new_size(net
->xfrm
.state_hmask
);
127 ndst
= xfrm_hash_alloc(nsize
);
130 nsrc
= xfrm_hash_alloc(nsize
);
/* Unwind: release the dst table already allocated. */
132 xfrm_hash_free(ndst
, nsize
);
135 nspi
= xfrm_hash_alloc(nsize
);
/* Unwind: release the dst and src tables already allocated. */
137 xfrm_hash_free(ndst
, nsize
);
138 xfrm_hash_free(nsrc
, nsize
);
142 spin_lock_bh(&net
->xfrm
.xfrm_state_lock
);
143 write_seqcount_begin(&xfrm_state_hash_generation
);
/* nsize is a byte count; convert it back to a bucket mask. */
145 nhashmask
= (nsize
/ sizeof(struct hlist_head
)) - 1U;
146 odst
= xfrm_state_deref_prot(net
->xfrm
.state_bydst
, net
);
/* Walk the old buckets from the highest index down to 0. */
147 for (i
= net
->xfrm
.state_hmask
; i
>= 0; i
--)
148 xfrm_hash_transfer(odst
+ i
, ndst
, nsrc
, nspi
, nhashmask
);
150 osrc
= xfrm_state_deref_prot(net
->xfrm
.state_bysrc
, net
);
151 ospi
= xfrm_state_deref_prot(net
->xfrm
.state_byspi
, net
);
152 ohashmask
= net
->xfrm
.state_hmask
;
154 rcu_assign_pointer(net
->xfrm
.state_bydst
, ndst
);
155 rcu_assign_pointer(net
->xfrm
.state_bysrc
, nsrc
);
156 rcu_assign_pointer(net
->xfrm
.state_byspi
, nspi
);
157 net
->xfrm
.state_hmask
= nhashmask
;
159 write_seqcount_end(&xfrm_state_hash_generation
);
160 spin_unlock_bh(&net
->xfrm
.xfrm_state_lock
);
/* Byte size of each old table, derived from the old mask. */
162 osize
= (ohashmask
+ 1) * sizeof(struct hlist_head
);
166 xfrm_hash_free(odst
, osize
);
167 xfrm_hash_free(osrc
, osize
);
168 xfrm_hash_free(ospi
, osize
);
/*
 * Per-address-family state operations, indexed by family (NPROTO slots),
 * together with a spinlock declared alongside the array.
 * NOTE(review): the lock's users are outside this view; presumably it
 * serialises updates of the array -- confirm.
 */
171 static DEFINE_SPINLOCK(xfrm_state_afinfo_lock
);
172 static struct xfrm_state_afinfo __rcu
*xfrm_state_afinfo
[NPROTO
];
/* Protects xfrm_state_gc_list (taken around every list access below). */
174 static DEFINE_SPINLOCK(xfrm_state_gc_lock
);
/* Forward declarations for functions used before their definitions. */
176 int __xfrm_state_delete(struct xfrm_state
*x
);
178 int km_query(struct xfrm_state
*x
, struct xfrm_tmpl
*t
, struct xfrm_policy
*pol
);
179 static bool km_is_alive(const struct km_event
*c
);
180 void km_state_expired(struct xfrm_state
*x
, int hard
, u32 portid
);
/*
 * Register an xfrm_type for an address family.
 *
 * The family's afinfo is looked up first (-EAFNOSUPPORT is a visible
 * return value).  The local X() helper then WARNs if the per-protocol
 * slot afinfo->type_<name> is already occupied and stores the type in it;
 * the slot is chosen by a switch on type->proto (comp, esp, ipip,
 * dstopts, routing and ipip6 slots are visible).  err is set to
 * -EPROTONOSUPPORT on one path, presumably the switch default.
 * NOTE(review): several case labels, the end of the X() macro and the
 * return path are not visible in this view.
 */
182 int xfrm_register_type(const struct xfrm_type
*type
, unsigned short family
)
184 struct xfrm_state_afinfo
*afinfo
= xfrm_state_get_afinfo(family
);
188 return -EAFNOSUPPORT
;
190 #define X(afi, T, name) do { \
191 WARN_ON((afi)->type_ ## name); \
192 (afi)->type_ ## name = (T); \
195 switch (type
->proto
) {
197 X(afinfo
, type
, comp
);
203 X(afinfo
, type
, esp
);
206 X(afinfo
, type
, ipip
);
208 case IPPROTO_DSTOPTS
:
209 X(afinfo
, type
, dstopts
);
211 case IPPROTO_ROUTING
:
212 X(afinfo
, type
, routing
);
215 X(afinfo
, type
, ipip6
);
219 err
= -EPROTONOSUPPORT
;
226 EXPORT_SYMBOL(xfrm_register_type
);
/*
 * Unregister an xfrm_type for an address family.
 *
 * Mirror image of xfrm_register_type(): the local X() helper WARNs if the
 * per-protocol slot afinfo->type_<name> does not currently hold this type
 * and then clears the slot to NULL.  The slot is chosen by a switch on
 * type->proto.
 * NOTE(review): the action taken when afinfo is NULL, several case labels
 * and the end of the X() macro are not visible in this view.
 */
228 void xfrm_unregister_type(const struct xfrm_type
*type
, unsigned short family
)
230 struct xfrm_state_afinfo
*afinfo
= xfrm_state_get_afinfo(family
);
232 if (unlikely(afinfo
== NULL
))
235 #define X(afi, T, name) do { \
236 WARN_ON((afi)->type_ ## name != (T)); \
237 (afi)->type_ ## name = NULL; \
240 switch (type
->proto
) {
242 X(afinfo
, type
, comp
);
248 X(afinfo
, type
, esp
);
251 X(afinfo
, type
, ipip
);
253 case IPPROTO_DSTOPTS
:
254 X(afinfo
, type
, dstopts
);
256 case IPPROTO_ROUTING
:
257 X(afinfo
, type
, routing
);
260 X(afinfo
, type
, ipip6
);
269 EXPORT_SYMBOL(xfrm_unregister_type
);
/*
 * Look up the registered xfrm_type for (proto, family) and pin its owning
 * module.
 *
 * The type is read from the afinfo slot matching proto (comp, ah, esp,
 * ipip, dstopts, routing, ipip6 slots are visible).  A type whose module
 * cannot be pinned with try_module_get() is treated as a failure case.
 * If no type was found and no module load has been attempted yet,
 * request_module("xfrm-type-<family>-<proto>") is issued and
 * modload_attempted is set so this happens at most once per call.
 * NOTE(review): the switch header, the retry jump after the module load
 * and the return statement are not visible in this view.
 */
271 static const struct xfrm_type
*xfrm_get_type(u8 proto
, unsigned short family
)
273 const struct xfrm_type
*type
= NULL
;
274 struct xfrm_state_afinfo
*afinfo
;
275 int modload_attempted
= 0;
278 afinfo
= xfrm_state_get_afinfo(family
);
279 if (unlikely(afinfo
== NULL
))
284 type
= afinfo
->type_comp
;
287 type
= afinfo
->type_ah
;
290 type
= afinfo
->type_esp
;
293 type
= afinfo
->type_ipip
;
295 case IPPROTO_DSTOPTS
:
296 type
= afinfo
->type_dstopts
;
298 case IPPROTO_ROUTING
:
299 type
= afinfo
->type_routing
;
302 type
= afinfo
->type_ipip6
;
308 if (unlikely(type
&& !try_module_get(type
->owner
)))
313 if (!type
&& !modload_attempted
) {
314 request_module("xfrm-type-%d-%d", family
, proto
);
315 modload_attempted
= 1;
/*
 * Drop the module reference on type->owner; counterpart of the
 * try_module_get() performed in xfrm_get_type().
 */
322 static void xfrm_put_type(const struct xfrm_type
*type
)
324 module_put(type
->owner
);
/*
 * Register an offload type for an address family.
 *
 * Returns -EAFNOSUPPORT when the family has no afinfo.  Otherwise a
 * switch on type->proto stores the type in afinfo->type_offload_esp,
 * WARNing if that slot is already occupied; err is set to
 * -EPROTONOSUPPORT on another path, presumably the switch default.
 * NOTE(review): the case labels and the return path are not visible in
 * this view.
 */
327 int xfrm_register_type_offload(const struct xfrm_type_offload
*type
,
328 unsigned short family
)
330 struct xfrm_state_afinfo
*afinfo
= xfrm_state_get_afinfo(family
);
333 if (unlikely(afinfo
== NULL
))
334 return -EAFNOSUPPORT
;
336 switch (type
->proto
) {
338 WARN_ON(afinfo
->type_offload_esp
);
339 afinfo
->type_offload_esp
= type
;
343 err
= -EPROTONOSUPPORT
;
350 EXPORT_SYMBOL(xfrm_register_type_offload
);
/*
 * Unregister an offload type for an address family.
 *
 * In the switch on type->proto, WARNs if afinfo->type_offload_esp does not
 * currently hold this type and then clears the slot to NULL.
 * NOTE(review): the action taken when afinfo is NULL and the case labels
 * are not visible in this view.
 */
352 void xfrm_unregister_type_offload(const struct xfrm_type_offload
*type
,
353 unsigned short family
)
355 struct xfrm_state_afinfo
*afinfo
= xfrm_state_get_afinfo(family
);
357 if (unlikely(afinfo
== NULL
))
360 switch (type
->proto
) {
362 WARN_ON(afinfo
->type_offload_esp
!= type
);
363 afinfo
->type_offload_esp
= NULL
;
371 EXPORT_SYMBOL(xfrm_unregister_type_offload
);
/*
 * Look up the registered offload type for (proto, family) and pin its
 * owning module with try_module_get().
 *
 * When nothing is registered and try_load is true,
 * request_module("xfrm-offload-<family>-<proto>") is issued.
 * NOTE(review): the switch on proto, what follows the module request
 * (presumably a single retry) and the return statement are not visible
 * in this view.
 */
373 static const struct xfrm_type_offload
*
374 xfrm_get_type_offload(u8 proto
, unsigned short family
, bool try_load
)
376 const struct xfrm_type_offload
*type
= NULL
;
377 struct xfrm_state_afinfo
*afinfo
;
380 afinfo
= xfrm_state_get_afinfo(family
);
381 if (unlikely(afinfo
== NULL
))
386 type
= afinfo
->type_offload_esp
;
392 if ((type
&& !try_module_get(type
->owner
)))
397 if (!type
&& try_load
) {
398 request_module("xfrm-offload-%d-%d", family
, proto
);
/*
 * Drop the module reference on type->owner; counterpart of the
 * try_module_get() performed in xfrm_get_type_offload().
 */
406 static void xfrm_put_type_offload(const struct xfrm_type_offload
*type
)
408 module_put(type
->owner
);
/*
 * IPv4 mode descriptors, one slot per XFRM_MODE_* value (array sized
 * XFRM_MODE_MAX).  BEET and TUNNEL carry XFRM_MODE_FLAG_TUNNEL; no flag
 * is visible for TRANSPORT.  xfrm_get_mode() compares each entry's
 * family field against the requested family.
 * NOTE(review): the .family initialisers and the designator of the first
 * entry are not visible in this view.
 */
411 static const struct xfrm_mode xfrm4_mode_map
[XFRM_MODE_MAX
] = {
413 .encap
= XFRM_MODE_BEET
,
414 .flags
= XFRM_MODE_FLAG_TUNNEL
,
417 [XFRM_MODE_TRANSPORT
] = {
418 .encap
= XFRM_MODE_TRANSPORT
,
421 [XFRM_MODE_TUNNEL
] = {
422 .encap
= XFRM_MODE_TUNNEL
,
423 .flags
= XFRM_MODE_FLAG_TUNNEL
,
/*
 * IPv6 mode descriptors, one slot per XFRM_MODE_* value (array sized
 * XFRM_MODE_MAX).  Compared with the IPv4 map this one additionally has a
 * ROUTEOPTIMIZATION entry.  BEET and TUNNEL carry XFRM_MODE_FLAG_TUNNEL.
 * NOTE(review): the .family initialisers and the designator of the first
 * entry are not visible in this view.
 */
428 static const struct xfrm_mode xfrm6_mode_map
[XFRM_MODE_MAX
] = {
430 .encap
= XFRM_MODE_BEET
,
431 .flags
= XFRM_MODE_FLAG_TUNNEL
,
434 [XFRM_MODE_ROUTEOPTIMIZATION
] = {
435 .encap
= XFRM_MODE_ROUTEOPTIMIZATION
,
438 [XFRM_MODE_TRANSPORT
] = {
439 .encap
= XFRM_MODE_TRANSPORT
,
442 [XFRM_MODE_TUNNEL
] = {
443 .encap
= XFRM_MODE_TUNNEL
,
444 .flags
= XFRM_MODE_FLAG_TUNNEL
,
/*
 * Return the mode descriptor for an encapsulation mode in a given family.
 *
 * encap values >= XFRM_MODE_MAX are rejected before any table access.
 * The entry is taken from xfrm4_mode_map or xfrm6_mode_map and is only
 * accepted when its family field equals the requested family, which
 * filters out slots that were never initialised for that family.
 * NOTE(review): the switch on family and the return statements are not
 * visible in this view; presumably NULL is returned on failure.
 */
449 static const struct xfrm_mode
*xfrm_get_mode(unsigned int encap
, int family
)
451 const struct xfrm_mode
*mode
;
453 if (unlikely(encap
>= XFRM_MODE_MAX
))
458 mode
= &xfrm4_mode_map
[encap
];
459 if (mode
->family
== family
)
463 mode
= &xfrm6_mode_map
[encap
];
464 if (mode
->family
== family
)
/*
 * Return a state object to xfrm_state_cache.  Only the memory is
 * released here; no timers or sub-objects are touched.
 */
474 void xfrm_state_free(struct xfrm_state
*x
)
476 kmem_cache_free(xfrm_state_cache
, x
);
478 EXPORT_SYMBOL(xfrm_state_free
);
/*
 * Final teardown of a state: cancels the lifetime hrtimer (mtimer) and the
 * replay timer (rtimer, waiting for a running handler), frees the ESN
 * replay buffers, releases the offload type and the type (calling the
 * type's destructor first), drops the xfrag page and frees the device
 * offload and security state.
 * NOTE(review): other frees, the NULL guards presumably wrapping several
 * of these calls, and the final release of x itself are not visible in
 * this view.
 */
480 static void ___xfrm_state_destroy(struct xfrm_state
*x
)
482 hrtimer_cancel(&x
->mtimer
);
483 del_timer_sync(&x
->rtimer
);
490 kfree(x
->replay_esn
);
491 kfree(x
->preplay_esn
);
493 xfrm_put_type_offload(x
->type_offload
);
495 x
->type
->destructor(x
);
496 xfrm_put_type(x
->type
);
499 put_page(x
->xfrag
.page
);
500 xfrm_dev_state_free(x
);
501 security_xfrm_state_free(x
);
/*
 * Work handler for xfrm_state_gc_work.  The global xfrm_state_gc_list is
 * moved onto a local list head under xfrm_state_gc_lock so the lock is
 * held only briefly; every queued state is then destroyed with
 * ___xfrm_state_destroy() outside the lock.
 */
505 static void xfrm_state_gc_task(struct work_struct
*work
)
507 struct xfrm_state
*x
;
508 struct hlist_node
*tmp
;
509 struct hlist_head gc_list
;
511 spin_lock_bh(&xfrm_state_gc_lock
);
512 hlist_move_list(&xfrm_state_gc_list
, &gc_list
);
513 spin_unlock_bh(&xfrm_state_gc_lock
);
/* _safe iteration: each entry is destroyed while walking. */
517 hlist_for_each_entry_safe(x
, tmp
, &gc_list
, gclist
)
518 ___xfrm_state_destroy(x
);
/*
 * hrtimer callback for a state's lifetime timer (x->mtimer).
 *
 * Using ktime_get_real_seconds() as "now", it evaluates the four lifetime
 * limits (hard/soft x add/use).  For use-based limits a zero
 * curlft.use_time is replaced by now.  A soft expiry is reported with
 * km_state_expired(x, 0, 0); if a next deadline was computed
 * (next != TIME64_MAX) the timer is forwarded by that many seconds and
 * HRTIMER_RESTART is returned.  On the hard-expiry path an ACQ state with
 * no SPI is marked EXPIRED, the state is deleted with
 * __xfrm_state_delete(), km_state_expired(x, 1, 0) is sent and the
 * deletion is audited.  x->lock is released before returning.
 *
 * NOTE(review): tmo is declared long while it is computed from the
 * time64_t value now; confirm this cannot truncate on 32-bit builds.
 * NOTE(review): the lock acquisition, the comparisons of tmo against
 * zero/next, the labels and the return are not visible in this view.
 */
521 static enum hrtimer_restart
xfrm_timer_handler(struct hrtimer
*me
)
523 struct xfrm_state
*x
= container_of(me
, struct xfrm_state
, mtimer
);
524 enum hrtimer_restart ret
= HRTIMER_NORESTART
;
525 time64_t now
= ktime_get_real_seconds();
526 time64_t next
= TIME64_MAX
;
531 if (x
->km
.state
== XFRM_STATE_DEAD
)
533 if (x
->km
.state
== XFRM_STATE_EXPIRED
)
535 if (x
->lft
.hard_add_expires_seconds
) {
536 long tmo
= x
->lft
.hard_add_expires_seconds
+
537 x
->curlft
.add_time
- now
;
539 if (x
->xflags
& XFRM_SOFT_EXPIRE
) {
540 /* enter hard expire without soft expire first?!
541 * setting a new date could trigger this.
542 * workaround: fix x->curflt.add_time by below:
544 x
->curlft
.add_time
= now
- x
->saved_tmo
- 1;
545 tmo
= x
->lft
.hard_add_expires_seconds
- x
->saved_tmo
;
552 if (x
->lft
.hard_use_expires_seconds
) {
553 long tmo
= x
->lft
.hard_use_expires_seconds
+
554 (x
->curlft
.use_time
? : now
) - now
;
562 if (x
->lft
.soft_add_expires_seconds
) {
563 long tmo
= x
->lft
.soft_add_expires_seconds
+
564 x
->curlft
.add_time
- now
;
567 x
->xflags
&= ~XFRM_SOFT_EXPIRE
;
568 } else if (tmo
< next
) {
570 x
->xflags
|= XFRM_SOFT_EXPIRE
;
574 if (x
->lft
.soft_use_expires_seconds
) {
575 long tmo
= x
->lft
.soft_use_expires_seconds
+
576 (x
->curlft
.use_time
? : now
) - now
;
585 km_state_expired(x
, 0, 0);
587 if (next
!= TIME64_MAX
) {
588 hrtimer_forward_now(&x
->mtimer
, ktime_set(next
, 0));
589 ret
= HRTIMER_RESTART
;
595 if (x
->km
.state
== XFRM_STATE_ACQ
&& x
->id
.spi
== 0)
596 x
->km
.state
= XFRM_STATE_EXPIRED
;
598 err
= __xfrm_state_delete(x
);
600 km_state_expired(x
, 1, 0);
602 xfrm_audit_state_delete(x
, err
? 0 : 1, true);
605 spin_unlock(&x
->lock
);
/*
 * Forward declaration: callback installed on x->rtimer by
 * xfrm_state_alloc(); its definition is outside this view.
 */
609 static void xfrm_replay_timer_handler(struct timer_list
*t
);
/*
 * Allocate and initialise a new state for a network namespace.
 *
 * The object comes zeroed from xfrm_state_cache with GFP_ATOMIC.  The
 * visible initialisation sets the owning netns, a reference count of 1,
 * zero tunnel users, the list and hash linkage, the lifetime hrtimer
 * (CLOCK_BOOTTIME, HRTIMER_MODE_ABS_SOFT, handler xfrm_timer_handler),
 * the replay timer, curlft.add_time = current real time, all four
 * byte/packet limits to XFRM_INF, zero replay maxage/maxdiff and the
 * per-state spinlock.
 * NOTE(review): the allocation-failure check and the return statement are
 * not visible in this view; presumably NULL is returned on failure.
 */
611 struct xfrm_state
*xfrm_state_alloc(struct net
*net
)
613 struct xfrm_state
*x
;
615 x
= kmem_cache_zalloc(xfrm_state_cache
, GFP_ATOMIC
);
618 write_pnet(&x
->xs_net
, net
);
619 refcount_set(&x
->refcnt
, 1);
620 atomic_set(&x
->tunnel_users
, 0);
621 INIT_LIST_HEAD(&x
->km
.all
);
622 INIT_HLIST_NODE(&x
->bydst
);
623 INIT_HLIST_NODE(&x
->bysrc
);
624 INIT_HLIST_NODE(&x
->byspi
);
625 hrtimer_init(&x
->mtimer
, CLOCK_BOOTTIME
, HRTIMER_MODE_ABS_SOFT
);
626 x
->mtimer
.function
= xfrm_timer_handler
;
627 timer_setup(&x
->rtimer
, xfrm_replay_timer_handler
, 0);
628 x
->curlft
.add_time
= ktime_get_real_seconds();
629 x
->lft
.soft_byte_limit
= XFRM_INF
;
630 x
->lft
.soft_packet_limit
= XFRM_INF
;
631 x
->lft
.hard_byte_limit
= XFRM_INF
;
632 x
->lft
.hard_packet_limit
= XFRM_INF
;
633 x
->replay_maxage
= 0;
634 x
->replay_maxdiff
= 0;
635 spin_lock_init(&x
->lock
);
639 EXPORT_SYMBOL(xfrm_state_alloc
);
/*
 * Destroy a state that is already marked dead (WARNs if km.state is not
 * XFRM_STATE_DEAD).
 *
 * Two paths are visible: immediate teardown with ___xfrm_state_destroy(),
 * or deferred teardown by adding x to xfrm_state_gc_list under
 * xfrm_state_gc_lock and scheduling xfrm_state_gc_work.
 * NOTE(review): the branch selecting between them is not visible in this
 * view; presumably it tests the sync argument.
 */
641 void __xfrm_state_destroy(struct xfrm_state
*x
, bool sync
)
643 WARN_ON(x
->km
.state
!= XFRM_STATE_DEAD
);
647 ___xfrm_state_destroy(x
);
649 spin_lock_bh(&xfrm_state_gc_lock
);
650 hlist_add_head(&x
->gclist
, &xfrm_state_gc_list
);
651 spin_unlock_bh(&xfrm_state_gc_lock
);
652 schedule_work(&xfrm_state_gc_work
);
655 EXPORT_SYMBOL(__xfrm_state_destroy
);
/*
 * Unlink a state from all lookup structures and mark it dead.
 *
 * Acts only if the state is not already XFRM_STATE_DEAD.  The state is
 * flagged DEAD first; then, under the netns xfrm_state_lock, it is
 * removed from the state_all list and from the bydst, bysrc and byspi
 * hash chains, and state_num is decremented.  After unlocking, the encap
 * socket reference is dropped and the device offload is notified.
 * Uses plain spin_lock(), so callers are expected to have bottom halves
 * disabled already (xfrm_state_delete() takes x->lock with _bh).
 * NOTE(review): guards around the byspi removal and the sock_put(), the
 * final reference drop and the return values are not visible in this
 * view.
 */
657 int __xfrm_state_delete(struct xfrm_state
*x
)
659 struct net
*net
= xs_net(x
);
662 if (x
->km
.state
!= XFRM_STATE_DEAD
) {
663 x
->km
.state
= XFRM_STATE_DEAD
;
664 spin_lock(&net
->xfrm
.xfrm_state_lock
);
665 list_del(&x
->km
.all
);
666 hlist_del_rcu(&x
->bydst
);
667 hlist_del_rcu(&x
->bysrc
);
669 hlist_del_rcu(&x
->byspi
);
670 net
->xfrm
.state_num
--;
671 spin_unlock(&net
->xfrm
.xfrm_state_lock
);
674 sock_put(rcu_dereference_raw(x
->encap_sk
));
676 xfrm_dev_state_delete(x
);
678 /* All xfrm_state objects are created by xfrm_state_alloc.
679 * The xfrm_state_alloc call gives a reference, and that
680 * is what we are dropping here.
688 EXPORT_SYMBOL(__xfrm_state_delete
);
/*
 * Locked wrapper around __xfrm_state_delete(): takes x->lock with bottom
 * halves disabled for the duration of the call and stores the result in
 * err.
 * NOTE(review): the declaration of err and the return statement are not
 * visible in this view.
 */
690 int xfrm_state_delete(struct xfrm_state
*x
)
694 spin_lock_bh(&x
->lock
);
695 err
= __xfrm_state_delete(x
);
696 spin_unlock_bh(&x
->lock
);
700 EXPORT_SYMBOL(xfrm_state_delete
);
702 #ifdef CONFIG_SECURITY_NETWORK_XFRM
/*
 * Pre-flight security check for xfrm_state_flush(): walks every bydst
 * bucket and, for each state whose protocol matches proto, asks the LSM
 * via security_xfrm_state_delete().  On a non-zero answer the refused
 * deletion is audited (result 0).
 * The walk uses the non-RCU iterator, so the caller presumably holds
 * xfrm_state_lock (xfrm_state_flush() does).
 * NOTE(review): the return type, local declarations and the return path
 * are not visible in this view.
 */
704 xfrm_state_flush_secctx_check(struct net
*net
, u8 proto
, bool task_valid
)
708 for (i
= 0; i
<= net
->xfrm
.state_hmask
; i
++) {
709 struct xfrm_state
*x
;
711 hlist_for_each_entry(x
, net
->xfrm
.state_bydst
+i
, bydst
) {
712 if (xfrm_id_proto_match(x
->id
.proto
, proto
) &&
713 (err
= security_xfrm_state_delete(x
)) != 0) {
714 xfrm_audit_state_delete(x
, 0, task_valid
);
/*
 * Pre-flight security check for xfrm_dev_state_flush(): walks every bydst
 * bucket and, for each state whose offload device (xso->dev) is dev, asks
 * the LSM via security_xfrm_state_delete().  On a non-zero answer the
 * refused deletion is audited (result 0).
 * NOTE(review): the return type, the assignment of xso and the return
 * path are not visible in this view.
 */
724 xfrm_dev_state_flush_secctx_check(struct net
*net
, struct net_device
*dev
, bool task_valid
)
728 for (i
= 0; i
<= net
->xfrm
.state_hmask
; i
++) {
729 struct xfrm_state
*x
;
730 struct xfrm_state_offload
*xso
;
732 hlist_for_each_entry(x
, net
->xfrm
.state_bydst
+i
, bydst
) {
735 if (xso
->dev
== dev
&&
736 (err
= security_xfrm_state_delete(x
)) != 0) {
737 xfrm_audit_state_delete(x
, 0, task_valid
);
/*
 * Second definition of xfrm_state_flush_secctx_check() with the same
 * parameters.  Presumably the stub built when
 * CONFIG_SECURITY_NETWORK_XFRM is not set -- the preprocessor branch and
 * the body are not visible in this view; confirm.
 */
747 xfrm_state_flush_secctx_check(struct net
*net
, u8 proto
, bool task_valid
)
/*
 * Second definition of xfrm_dev_state_flush_secctx_check() with the same
 * parameters.  Presumably the stub built when
 * CONFIG_SECURITY_NETWORK_XFRM is not set -- the preprocessor branch and
 * the body are not visible in this view; confirm.
 */
753 xfrm_dev_state_flush_secctx_check(struct net
*net
, struct net_device
*dev
, bool task_valid
)
/*
 * Delete every non-kernel state in a netns whose protocol matches proto.
 *
 * Under xfrm_state_lock the security pre-check runs first.  The bydst
 * table is then scanned; for each state that is not kernel-owned
 * (xfrm_state_kern()) and matches proto, the lock is dropped,
 * the state is deleted with xfrm_state_delete() and the result audited,
 * and the lock is retaken before the scan continues.
 * xfrm_state_put_sync() is one visible way the per-state reference is
 * dropped.
 * NOTE(review): the reference taken before unlocking, the restart of the
 * bucket walk after relocking, the use of sync and cnt, and the return
 * value are not visible in this view.
 */
759 int xfrm_state_flush(struct net
*net
, u8 proto
, bool task_valid
, bool sync
)
761 int i
, err
= 0, cnt
= 0;
763 spin_lock_bh(&net
->xfrm
.xfrm_state_lock
);
764 err
= xfrm_state_flush_secctx_check(net
, proto
, task_valid
);
769 for (i
= 0; i
<= net
->xfrm
.state_hmask
; i
++) {
770 struct xfrm_state
*x
;
772 hlist_for_each_entry(x
, net
->xfrm
.state_bydst
+i
, bydst
) {
773 if (!xfrm_state_kern(x
) &&
774 xfrm_id_proto_match(x
->id
.proto
, proto
)) {
776 spin_unlock_bh(&net
->xfrm
.xfrm_state_lock
);
778 err
= xfrm_state_delete(x
);
779 xfrm_audit_state_delete(x
, err
? 0 : 1,
782 xfrm_state_put_sync(x
);
788 spin_lock_bh(&net
->xfrm
.xfrm_state_lock
);
794 spin_unlock_bh(&net
->xfrm
.xfrm_state_lock
);
800 EXPORT_SYMBOL(xfrm_state_flush
);
/*
 * Delete every non-kernel state in a netns that is offloaded to dev.
 *
 * Same structure as xfrm_state_flush(): the security pre-check runs under
 * xfrm_state_lock, then the bydst table is scanned and, for each matching
 * state (not kernel-owned and xso->dev == dev), the lock is dropped
 * around xfrm_state_delete() plus auditing and retaken afterwards.
 * NOTE(review): the assignment of xso, the reference handling, the use of
 * cnt and the return value are not visible in this view.
 */
802 int xfrm_dev_state_flush(struct net
*net
, struct net_device
*dev
, bool task_valid
)
804 int i
, err
= 0, cnt
= 0;
806 spin_lock_bh(&net
->xfrm
.xfrm_state_lock
);
807 err
= xfrm_dev_state_flush_secctx_check(net
, dev
, task_valid
);
812 for (i
= 0; i
<= net
->xfrm
.state_hmask
; i
++) {
813 struct xfrm_state
*x
;
814 struct xfrm_state_offload
*xso
;
816 hlist_for_each_entry(x
, net
->xfrm
.state_bydst
+i
, bydst
) {
819 if (!xfrm_state_kern(x
) && xso
->dev
== dev
) {
821 spin_unlock_bh(&net
->xfrm
.xfrm_state_lock
);
823 err
= xfrm_state_delete(x
);
824 xfrm_audit_state_delete(x
, err
? 0 : 1,
830 spin_lock_bh(&net
->xfrm
.xfrm_state_lock
);
839 spin_unlock_bh(&net
->xfrm
.xfrm_state_lock
);
842 EXPORT_SYMBOL(xfrm_dev_state_flush
);
/*
 * Fill *si with a snapshot of the state database counters, taken under
 * xfrm_state_lock:
 *   sadcnt   - number of states (state_num)
 *   sadhcnt  - current number of hash buckets (state_hmask + 1)
 *   sadhmcnt - the xfrm_state_hashmax limit
 */
844 void xfrm_sad_getinfo(struct net
*net
, struct xfrmk_sadinfo
*si
)
846 spin_lock_bh(&net
->xfrm
.xfrm_state_lock
);
847 si
->sadcnt
= net
->xfrm
.state_num
;
848 si
->sadhcnt
= net
->xfrm
.state_hmask
+ 1;
849 si
->sadhmcnt
= xfrm_state_hashmax
;
850 spin_unlock_bh(&net
->xfrm
.xfrm_state_lock
);
852 EXPORT_SYMBOL(xfrm_sad_getinfo
);
/*
 * Build an exact-match IPv4 selector from a flow: addresses, ports and
 * protocol are copied from the flowi4, both port masks are all-ones
 * (htons(0xffff)), both prefix lengths are 32, the family is AF_INET and
 * ifindex comes from the flow's output interface.
 * NOTE(review): the return type line is not visible in this view.
 */
855 __xfrm4_init_tempsel(struct xfrm_selector
*sel
, const struct flowi
*fl
)
857 const struct flowi4
*fl4
= &fl
->u
.ip4
;
859 sel
->daddr
.a4
= fl4
->daddr
;
860 sel
->saddr
.a4
= fl4
->saddr
;
861 sel
->dport
= xfrm_flowi_dport(fl
, &fl4
->uli
);
862 sel
->dport_mask
= htons(0xffff);
863 sel
->sport
= xfrm_flowi_sport(fl
, &fl4
->uli
);
864 sel
->sport_mask
= htons(0xffff);
865 sel
->family
= AF_INET
;
866 sel
->prefixlen_d
= 32;
867 sel
->prefixlen_s
= 32;
868 sel
->proto
= fl4
->flowi4_proto
;
869 sel
->ifindex
= fl4
->flowi4_oif
;
/*
 * Build an exact-match IPv6 selector from a flow: addresses, ports and
 * protocol are copied from the flowi6, both port masks are all-ones
 * (htons(0xffff)), both prefix lengths are 128, the family is AF_INET6
 * and ifindex comes from the flow's output interface.  The selector
 * address fields are written through a struct in6_addr cast.
 * NOTE(review): the return type line is not visible in this view.
 */
873 __xfrm6_init_tempsel(struct xfrm_selector
*sel
, const struct flowi
*fl
)
875 const struct flowi6
*fl6
= &fl
->u
.ip6
;
877 /* Initialize temporary selector matching only to current session. */
878 *(struct in6_addr
*)&sel
->daddr
= fl6
->daddr
;
879 *(struct in6_addr
*)&sel
->saddr
= fl6
->saddr
;
880 sel
->dport
= xfrm_flowi_dport(fl
, &fl6
->uli
);
881 sel
->dport_mask
= htons(0xffff);
882 sel
->sport
= xfrm_flowi_sport(fl
, &fl6
->uli
);
883 sel
->sport_mask
= htons(0xffff);
884 sel
->family
= AF_INET6
;
885 sel
->prefixlen_d
= 128;
886 sel
->prefixlen_s
= 128;
887 sel
->proto
= fl6
->flowi6_proto
;
888 sel
->ifindex
= fl6
->flowi6_oif
;
/*
 * Initialise a temporary (larval) state from a flow and a policy
 * template.
 *
 * The selector is filled by the IPv4 or IPv6 tempsel helper.  Then,
 * depending on tmpl->encap_family, the state's destination and source
 * addresses fall back to the daddr/saddr arguments whenever the
 * template-provided value is the wildcard (a4 == 0 for IPv4,
 * ipv6_addr_any() for IPv6).  Finally mode, reqid and family are copied
 * from the template.
 * NOTE(review): the return type, the switch on family, the case labels
 * and the copy of tmpl->id into x->id are not visible in this view.
 */
892 xfrm_init_tempstate(struct xfrm_state
*x
, const struct flowi
*fl
,
893 const struct xfrm_tmpl
*tmpl
,
894 const xfrm_address_t
*daddr
, const xfrm_address_t
*saddr
,
895 unsigned short family
)
899 __xfrm4_init_tempsel(&x
->sel
, fl
);
902 __xfrm6_init_tempsel(&x
->sel
, fl
);
908 switch (tmpl
->encap_family
) {
910 if (x
->id
.daddr
.a4
== 0)
911 x
->id
.daddr
.a4
= daddr
->a4
;
912 x
->props
.saddr
= tmpl
->saddr
;
913 if (x
->props
.saddr
.a4
== 0)
914 x
->props
.saddr
.a4
= saddr
->a4
;
917 if (ipv6_addr_any((struct in6_addr
*)&x
->id
.daddr
))
918 memcpy(&x
->id
.daddr
, daddr
, sizeof(x
->sel
.daddr
));
919 memcpy(&x
->props
.saddr
, &tmpl
->saddr
, sizeof(x
->props
.saddr
));
920 if (ipv6_addr_any((struct in6_addr
*)&x
->props
.saddr
))
921 memcpy(&x
->props
.saddr
, saddr
, sizeof(x
->props
.saddr
));
925 x
->props
.mode
= tmpl
->mode
;
926 x
->props
.reqid
= tmpl
->reqid
;
927 x
->props
.family
= tmpl
->encap_family
;
/*
 * Find a state by (daddr, spi, proto, family) in the by-SPI table.
 *
 * The bucket is walked with the RCU iterator.  Entries are skipped when
 * family, protocol or destination address differ, or when the masked mark
 * (mark & x->mark.m) does not equal x->mark.v.  A candidate is only
 * usable if a reference can be taken with xfrm_state_hold_rcu().
 * NOTE(review): the SPI comparison, the continue statements and the
 * return values are not visible in this view; presumably the referenced
 * state or NULL is returned.
 */
930 static struct xfrm_state
*__xfrm_state_lookup(struct net
*net
, u32 mark
,
931 const xfrm_address_t
*daddr
,
932 __be32 spi
, u8 proto
,
933 unsigned short family
)
935 unsigned int h
= xfrm_spi_hash(net
, daddr
, spi
, proto
, family
);
936 struct xfrm_state
*x
;
938 hlist_for_each_entry_rcu(x
, net
->xfrm
.state_byspi
+ h
, byspi
) {
939 if (x
->props
.family
!= family
||
941 x
->id
.proto
!= proto
||
942 !xfrm_addr_equal(&x
->id
.daddr
, daddr
, family
))
945 if ((mark
& x
->mark
.m
) != x
->mark
.v
)
947 if (!xfrm_state_hold_rcu(x
))
/*
 * Find a state by (daddr, saddr, proto, family) in the by-source table.
 *
 * The bucket is walked with the RCU iterator.  Entries are skipped when
 * family, protocol, destination or source address differ, or when the
 * masked mark (mark & x->mark.m) does not equal x->mark.v.  A candidate
 * is only usable if a reference can be taken with xfrm_state_hold_rcu().
 * NOTE(review): the continue statements and the return values are not
 * visible in this view; presumably the referenced state or NULL is
 * returned.
 */
955 static struct xfrm_state
*__xfrm_state_lookup_byaddr(struct net
*net
, u32 mark
,
956 const xfrm_address_t
*daddr
,
957 const xfrm_address_t
*saddr
,
958 u8 proto
, unsigned short family
)
960 unsigned int h
= xfrm_src_hash(net
, daddr
, saddr
, family
);
961 struct xfrm_state
*x
;
963 hlist_for_each_entry_rcu(x
, net
->xfrm
.state_bysrc
+ h
, bysrc
) {
964 if (x
->props
.family
!= family
||
965 x
->id
.proto
!= proto
||
966 !xfrm_addr_equal(&x
->id
.daddr
, daddr
, family
) ||
967 !xfrm_addr_equal(&x
->props
.saddr
, saddr
, family
))
970 if ((mark
& x
->mark
.m
) != x
->mark
.v
)
972 if (!xfrm_state_hold_rcu(x
))
/*
 * Look for an already-installed state equivalent to x, using x's own
 * masked mark (mark.v & mark.m).  One path looks up by SPI with
 * __xfrm_state_lookup(), the other by address pair with
 * __xfrm_state_lookup_byaddr().
 * NOTE(review): the condition choosing between the two (presumably
 * use_spi) and the address arguments of the by-address call are not
 * visible in this view.
 */
980 static inline struct xfrm_state
*
981 __xfrm_state_locate(struct xfrm_state
*x
, int use_spi
, int family
)
983 struct net
*net
= xs_net(x
);
984 u32 mark
= x
->mark
.v
& x
->mark
.m
;
987 return __xfrm_state_lookup(net
, mark
, &x
->id
.daddr
,
988 x
->id
.spi
, x
->id
.proto
, family
);
990 return __xfrm_state_lookup_byaddr(net
, mark
,
993 x
->id
.proto
, family
);
/*
 * Schedule a hash-table resize when all three conditions hold: the
 * caller saw a collision on insert, the bucket count (state_hmask + 1) is
 * still below xfrm_state_hashmax, and there are more states than
 * state_hmask.  The resize itself runs from net->xfrm.state_hash_work.
 */
996 static void xfrm_hash_grow_check(struct net
*net
, int have_hash_collision
)
998 if (have_hash_collision
&&
999 (net
->xfrm
.state_hmask
+ 1) < xfrm_state_hashmax
&&
1000 net
->xfrm
.state_num
> net
->xfrm
.state_hmask
)
1001 schedule_work(&net
->xfrm
.state_hash_work
);
/*
 * Evaluate one candidate state for xfrm_state_find() and update the
 * search results through the out-parameters.
 *
 * VALID state: rejected if its selector (when sel.family is set) does not
 * match the flow or the LSM flow match fails; otherwise it is compared
 * with the current *best, preferring a smaller km.dying value and, on a
 * tie, the larger curlft.add_time.
 * ACQ state: *acq_in_progress is set to 1.
 * ERROR or EXPIRED state: selector and LSM flow match are tested.
 * NOTE(review): the last parameter, the assignments to *best and the
 * action in the ERROR/EXPIRED branch are not visible in this view.
 */
1004 static void xfrm_state_look_at(struct xfrm_policy
*pol
, struct xfrm_state
*x
,
1005 const struct flowi
*fl
, unsigned short family
,
1006 struct xfrm_state
**best
, int *acq_in_progress
,
1009 /* Resolution logic:
1010 * 1. There is a valid state with matching selector. Done.
1011 * 2. Valid state with inappropriate selector. Skip.
1013 * Entering area of "sysdeps".
1015 * 3. If state is not valid, selector is temporary, it selects
1016 * only session which triggered previous resolution. Key
1017 * manager will do something to install a state with proper
1020 if (x
->km
.state
== XFRM_STATE_VALID
) {
1021 if ((x
->sel
.family
&&
1022 !xfrm_selector_match(&x
->sel
, fl
, x
->sel
.family
)) ||
1023 !security_xfrm_state_pol_flow_match(x
, pol
, fl
))
1027 (*best
)->km
.dying
> x
->km
.dying
||
1028 ((*best
)->km
.dying
== x
->km
.dying
&&
1029 (*best
)->curlft
.add_time
< x
->curlft
.add_time
))
1031 } else if (x
->km
.state
== XFRM_STATE_ACQ
) {
1032 *acq_in_progress
= 1;
1033 } else if (x
->km
.state
== XFRM_STATE_ERROR
||
1034 x
->km
.state
== XFRM_STATE_EXPIRED
) {
1035 if (xfrm_selector_match(&x
->sel
, fl
, x
->sel
.family
) &&
1036 security_xfrm_state_pol_flow_match(x
, pol
, fl
))
/*
 * Find, or start acquiring, a state that satisfies a policy template for
 * a flow.
 *
 * 1. The hash generation is sampled, then the bydst bucket for
 *    (daddr, saddr, reqid, encap_family) is walked under RCU; each entry
 *    matching family, reqid, mark, if_id, addresses, mode, proto and
 *    (optionally) SPI, and not flagged WILDRECV, is passed to
 *    xfrm_state_look_at().
 * 2. If that yields neither a best state nor an acquire in progress, the
 *    walk is repeated on the bucket hashed with a wildcard source
 *    address, comparing only the destination address.
 * 3. If nothing usable was found, no error occurred and no acquire is in
 *    progress: an existing state with the template's SPI is looked up,
 *    km_is_alive() is consulted, and otherwise a temporary state is
 *    allocated, initialised from the flow and template, given the
 *    policy's mark and an LSM context, and offered to the key manager
 *    with km_query().  On success it is inserted as XFRM_STATE_ACQ into
 *    the state_all list and the hash tables, its hard add lifetime and
 *    timer are set to sysctl_acq_expires, and a table grow check is
 *    made; on failure it is marked DEAD.
 * 4. *err receives -EAGAIN when an acquire is in progress, otherwise
 *    error.  The sampled generation is rechecked with
 *    read_seqcount_retry() at the end.
 *
 * NOTE(review): the return type, several locals (error, c), the RCU
 * read-side markers, labels/gotos, the guard around the byspi insertion
 * and the handling of a failed seqcount recheck are not visible in this
 * view.
 */
1042 xfrm_state_find(const xfrm_address_t
*daddr
, const xfrm_address_t
*saddr
,
1043 const struct flowi
*fl
, struct xfrm_tmpl
*tmpl
,
1044 struct xfrm_policy
*pol
, int *err
,
1045 unsigned short family
, u32 if_id
)
1047 static xfrm_address_t saddr_wildcard
= { };
1048 struct net
*net
= xp_net(pol
);
1049 unsigned int h
, h_wildcard
;
1050 struct xfrm_state
*x
, *x0
, *to_put
;
1051 int acquire_in_progress
= 0;
1053 struct xfrm_state
*best
= NULL
;
1054 u32 mark
= pol
->mark
.v
& pol
->mark
.m
;
1055 unsigned short encap_family
= tmpl
->encap_family
;
1056 unsigned int sequence
;
1061 sequence
= read_seqcount_begin(&xfrm_state_hash_generation
);
1064 h
= xfrm_dst_hash(net
, daddr
, saddr
, tmpl
->reqid
, encap_family
);
1065 hlist_for_each_entry_rcu(x
, net
->xfrm
.state_bydst
+ h
, bydst
) {
1066 if (x
->props
.family
== encap_family
&&
1067 x
->props
.reqid
== tmpl
->reqid
&&
1068 (mark
& x
->mark
.m
) == x
->mark
.v
&&
1069 x
->if_id
== if_id
&&
1070 !(x
->props
.flags
& XFRM_STATE_WILDRECV
) &&
1071 xfrm_state_addr_check(x
, daddr
, saddr
, encap_family
) &&
1072 tmpl
->mode
== x
->props
.mode
&&
1073 tmpl
->id
.proto
== x
->id
.proto
&&
1074 (tmpl
->id
.spi
== x
->id
.spi
|| !tmpl
->id
.spi
))
1075 xfrm_state_look_at(pol
, x
, fl
, encap_family
,
1076 &best
, &acquire_in_progress
, &error
);
1078 if (best
|| acquire_in_progress
)
1081 h_wildcard
= xfrm_dst_hash(net
, daddr
, &saddr_wildcard
, tmpl
->reqid
, encap_family
);
1082 hlist_for_each_entry_rcu(x
, net
->xfrm
.state_bydst
+ h_wildcard
, bydst
) {
1083 if (x
->props
.family
== encap_family
&&
1084 x
->props
.reqid
== tmpl
->reqid
&&
1085 (mark
& x
->mark
.m
) == x
->mark
.v
&&
1086 x
->if_id
== if_id
&&
1087 !(x
->props
.flags
& XFRM_STATE_WILDRECV
) &&
1088 xfrm_addr_equal(&x
->id
.daddr
, daddr
, encap_family
) &&
1089 tmpl
->mode
== x
->props
.mode
&&
1090 tmpl
->id
.proto
== x
->id
.proto
&&
1091 (tmpl
->id
.spi
== x
->id
.spi
|| !tmpl
->id
.spi
))
1092 xfrm_state_look_at(pol
, x
, fl
, encap_family
,
1093 &best
, &acquire_in_progress
, &error
);
1098 if (!x
&& !error
&& !acquire_in_progress
) {
1100 (x0
= __xfrm_state_lookup(net
, mark
, daddr
, tmpl
->id
.spi
,
1101 tmpl
->id
.proto
, encap_family
)) != NULL
) {
1108 /* If the KMs have no listeners (yet...), avoid allocating an SA
1109 * for each and every packet - garbage collection might not
1112 if (!km_is_alive(&c
)) {
1117 x
= xfrm_state_alloc(net
);
1122 /* Initialize temporary state matching only
1123 * to current session. */
1124 xfrm_init_tempstate(x
, fl
, tmpl
, daddr
, saddr
, family
);
1125 memcpy(&x
->mark
, &pol
->mark
, sizeof(x
->mark
));
1128 error
= security_xfrm_state_alloc_acquire(x
, pol
->security
, fl
->flowi_secid
);
1130 x
->km
.state
= XFRM_STATE_DEAD
;
1136 if (km_query(x
, tmpl
, pol
) == 0) {
1137 spin_lock_bh(&net
->xfrm
.xfrm_state_lock
);
1138 x
->km
.state
= XFRM_STATE_ACQ
;
1139 list_add(&x
->km
.all
, &net
->xfrm
.state_all
);
1140 hlist_add_head_rcu(&x
->bydst
, net
->xfrm
.state_bydst
+ h
);
1141 h
= xfrm_src_hash(net
, daddr
, saddr
, encap_family
);
1142 hlist_add_head_rcu(&x
->bysrc
, net
->xfrm
.state_bysrc
+ h
);
1144 h
= xfrm_spi_hash(net
, &x
->id
.daddr
, x
->id
.spi
, x
->id
.proto
, encap_family
);
1145 hlist_add_head_rcu(&x
->byspi
, net
->xfrm
.state_byspi
+ h
);
1147 x
->lft
.hard_add_expires_seconds
= net
->xfrm
.sysctl_acq_expires
;
1148 hrtimer_start(&x
->mtimer
,
1149 ktime_set(net
->xfrm
.sysctl_acq_expires
, 0),
1150 HRTIMER_MODE_REL_SOFT
);
1151 net
->xfrm
.state_num
++;
1152 xfrm_hash_grow_check(net
, x
->bydst
.next
!= NULL
);
1153 spin_unlock_bh(&net
->xfrm
.xfrm_state_lock
);
1155 x
->km
.state
= XFRM_STATE_DEAD
;
1163 if (!xfrm_state_hold_rcu(x
)) {
1168 *err
= acquire_in_progress
? -EAGAIN
: error
;
1172 xfrm_state_put(to_put
);
1174 if (read_seqcount_retry(&xfrm_state_hash_generation
, sequence
)) {
/*
 * Find a VALID state matching the given tuple without ever creating one.
 *
 * Under xfrm_state_lock the bydst bucket for (daddr, saddr, reqid,
 * family) is walked; an entry qualifies when family, reqid, mark, if_id,
 * addresses, mode and proto match, it is not flagged WILDRECV and its
 * km.state is XFRM_STATE_VALID.  A reference is taken on the result (rx)
 * before the lock is released.
 * NOTE(review): the return type, the assignment of rx, the guard around
 * xfrm_state_hold() and the return statement are not visible in this
 * view.
 */
1186 xfrm_stateonly_find(struct net
*net
, u32 mark
, u32 if_id
,
1187 xfrm_address_t
*daddr
, xfrm_address_t
*saddr
,
1188 unsigned short family
, u8 mode
, u8 proto
, u32 reqid
)
1191 struct xfrm_state
*rx
= NULL
, *x
= NULL
;
1193 spin_lock_bh(&net
->xfrm
.xfrm_state_lock
);
1194 h
= xfrm_dst_hash(net
, daddr
, saddr
, reqid
, family
);
1195 hlist_for_each_entry(x
, net
->xfrm
.state_bydst
+h
, bydst
) {
1196 if (x
->props
.family
== family
&&
1197 x
->props
.reqid
== reqid
&&
1198 (mark
& x
->mark
.m
) == x
->mark
.v
&&
1199 x
->if_id
== if_id
&&
1200 !(x
->props
.flags
& XFRM_STATE_WILDRECV
) &&
1201 xfrm_state_addr_check(x
, daddr
, saddr
, family
) &&
1202 mode
== x
->props
.mode
&&
1203 proto
== x
->id
.proto
&&
1204 x
->km
.state
== XFRM_STATE_VALID
) {
1211 xfrm_state_hold(rx
);
1212 spin_unlock_bh(&net
->xfrm
.xfrm_state_lock
);
1217 EXPORT_SYMBOL(xfrm_stateonly_find
);
/*
 * Find a state by SPI and family with a linear scan of the netns
 * state_all list, performed under xfrm_state_lock.  Each list node is a
 * struct xfrm_state_walk embedded in the state as its km member, hence
 * the container_of().  The lock is released on both exit paths.
 * NOTE(review): the SPI comparison, the reference taken on a hit and the
 * return values are not visible in this view.
 */
1219 struct xfrm_state
*xfrm_state_lookup_byspi(struct net
*net
, __be32 spi
,
1220 unsigned short family
)
1222 struct xfrm_state
*x
;
1223 struct xfrm_state_walk
*w
;
1225 spin_lock_bh(&net
->xfrm
.xfrm_state_lock
);
1226 list_for_each_entry(w
, &net
->xfrm
.state_all
, all
) {
1227 x
= container_of(w
, struct xfrm_state
, km
);
1228 if (x
->props
.family
!= family
||
1233 spin_unlock_bh(&net
->xfrm
.xfrm_state_lock
);
1236 spin_unlock_bh(&net
->xfrm
.xfrm_state_lock
);
1239 EXPORT_SYMBOL(xfrm_state_lookup_byspi
);
/*
 * Link a state into all lookup structures of its netns: the state_all
 * list and the bydst, bysrc and byspi hash tables.  The lifetime timer is
 * then started with a one second relative timeout, the replay timer is
 * armed when replay_maxage is non-zero, state_num is incremented and a
 * hash grow check is made (collision = the new bydst entry has a
 * successor).
 * No locking is done here; callers in this file take xfrm_state_lock
 * around the call.
 * NOTE(review): the guard around the byspi insertion and the last
 * argument of xfrm_spi_hash() are not visible in this view.
 */
1241 static void __xfrm_state_insert(struct xfrm_state
*x
)
1243 struct net
*net
= xs_net(x
);
1246 list_add(&x
->km
.all
, &net
->xfrm
.state_all
);
1248 h
= xfrm_dst_hash(net
, &x
->id
.daddr
, &x
->props
.saddr
,
1249 x
->props
.reqid
, x
->props
.family
);
1250 hlist_add_head_rcu(&x
->bydst
, net
->xfrm
.state_bydst
+ h
);
1252 h
= xfrm_src_hash(net
, &x
->id
.daddr
, &x
->props
.saddr
, x
->props
.family
);
1253 hlist_add_head_rcu(&x
->bysrc
, net
->xfrm
.state_bysrc
+ h
);
1256 h
= xfrm_spi_hash(net
, &x
->id
.daddr
, x
->id
.spi
, x
->id
.proto
,
1259 hlist_add_head_rcu(&x
->byspi
, net
->xfrm
.state_byspi
+ h
);
1262 hrtimer_start(&x
->mtimer
, ktime_set(1, 0), HRTIMER_MODE_REL_SOFT
);
1263 if (x
->replay_maxage
)
1264 mod_timer(&x
->rtimer
, jiffies
+ x
->replay_maxage
);
1266 net
->xfrm
.state_num
++;
1268 xfrm_hash_grow_check(net
, x
->bydst
.next
!= NULL
);
/*
 * Walk the bydst bucket of a state about to be inserted and select every
 * existing state with the same family, reqid, if_id, matching mark and
 * identical destination and source addresses.
 * NOTE(review): the action applied to each selected state is not visible
 * in this view; from the function name it presumably bumps their genid
 * -- confirm.
 */
1271 /* net->xfrm.xfrm_state_lock is held */
1272 static void __xfrm_state_bump_genids(struct xfrm_state
*xnew
)
1274 struct net
*net
= xs_net(xnew
);
1275 unsigned short family
= xnew
->props
.family
;
1276 u32 reqid
= xnew
->props
.reqid
;
1277 struct xfrm_state
*x
;
1279 u32 mark
= xnew
->mark
.v
& xnew
->mark
.m
;
1280 u32 if_id
= xnew
->if_id
;
1282 h
= xfrm_dst_hash(net
, &xnew
->id
.daddr
, &xnew
->props
.saddr
, reqid
, family
);
1283 hlist_for_each_entry(x
, net
->xfrm
.state_bydst
+h
, bydst
) {
1284 if (x
->props
.family
== family
&&
1285 x
->props
.reqid
== reqid
&&
1286 x
->if_id
== if_id
&&
1287 (mark
& x
->mark
.m
) == x
->mark
.v
&&
1288 xfrm_addr_equal(&x
->id
.daddr
, &xnew
->id
.daddr
, family
) &&
1289 xfrm_addr_equal(&x
->props
.saddr
, &xnew
->props
.saddr
, family
))
/*
 * Insert a fully set-up state unconditionally: under the netns
 * xfrm_state_lock (bottom halves disabled) it first runs
 * __xfrm_state_bump_genids() for x and then links x in with
 * __xfrm_state_insert().  No check for an existing equivalent state is
 * made here (compare xfrm_state_add()).
 */
1294 void xfrm_state_insert(struct xfrm_state
*x
)
1296 struct net
*net
= xs_net(x
);
1298 spin_lock_bh(&net
->xfrm
.xfrm_state_lock
);
1299 __xfrm_state_bump_genids(x
);
1300 __xfrm_state_insert(x
);
1301 spin_unlock_bh(&net
->xfrm
.xfrm_state_lock
);
1303 EXPORT_SYMBOL(xfrm_state_insert
);
/*
 * Find an existing ACQ (larval) state for the given tuple, or build one.
 *
 * The bydst bucket is searched for a state in XFRM_STATE_ACQ with the
 * same reqid, mode, family, proto, matching mark and identical
 * addresses.  The creation path allocates a state, fills selector,
 * source and destination addresses with exact-match prefixes (32 for the
 * a4 variant, 128 for the in6 variant), sets it to ACQ with the given
 * proto/family/mode/reqid, gives it a hard add lifetime of
 * sysctl_acq_expires and starts the timer accordingly, then links it
 * into state_all, bydst and bysrc (no byspi insertion is visible),
 * increments state_num and makes a hash grow check.
 * NOTE(review): the last parameter (callers pass 0 for it), the condition
 * gating creation, the remaining match conditions, the family switch,
 * the reference handling and the return value are not visible in this
 * view.
 */
1305 /* net->xfrm.xfrm_state_lock is held */
1306 static struct xfrm_state
*__find_acq_core(struct net
*net
,
1307 const struct xfrm_mark
*m
,
1308 unsigned short family
, u8 mode
,
1309 u32 reqid
, u32 if_id
, u8 proto
,
1310 const xfrm_address_t
*daddr
,
1311 const xfrm_address_t
*saddr
,
1314 unsigned int h
= xfrm_dst_hash(net
, daddr
, saddr
, reqid
, family
);
1315 struct xfrm_state
*x
;
1316 u32 mark
= m
->v
& m
->m
;
1318 hlist_for_each_entry(x
, net
->xfrm
.state_bydst
+h
, bydst
) {
1319 if (x
->props
.reqid
!= reqid
||
1320 x
->props
.mode
!= mode
||
1321 x
->props
.family
!= family
||
1322 x
->km
.state
!= XFRM_STATE_ACQ
||
1324 x
->id
.proto
!= proto
||
1325 (mark
& x
->mark
.m
) != x
->mark
.v
||
1326 !xfrm_addr_equal(&x
->id
.daddr
, daddr
, family
) ||
1327 !xfrm_addr_equal(&x
->props
.saddr
, saddr
, family
))
1337 x
= xfrm_state_alloc(net
);
1341 x
->sel
.daddr
.a4
= daddr
->a4
;
1342 x
->sel
.saddr
.a4
= saddr
->a4
;
1343 x
->sel
.prefixlen_d
= 32;
1344 x
->sel
.prefixlen_s
= 32;
1345 x
->props
.saddr
.a4
= saddr
->a4
;
1346 x
->id
.daddr
.a4
= daddr
->a4
;
1350 x
->sel
.daddr
.in6
= daddr
->in6
;
1351 x
->sel
.saddr
.in6
= saddr
->in6
;
1352 x
->sel
.prefixlen_d
= 128;
1353 x
->sel
.prefixlen_s
= 128;
1354 x
->props
.saddr
.in6
= saddr
->in6
;
1355 x
->id
.daddr
.in6
= daddr
->in6
;
1359 x
->km
.state
= XFRM_STATE_ACQ
;
1360 x
->id
.proto
= proto
;
1361 x
->props
.family
= family
;
1362 x
->props
.mode
= mode
;
1363 x
->props
.reqid
= reqid
;
1367 x
->lft
.hard_add_expires_seconds
= net
->xfrm
.sysctl_acq_expires
;
1369 hrtimer_start(&x
->mtimer
,
1370 ktime_set(net
->xfrm
.sysctl_acq_expires
, 0),
1371 HRTIMER_MODE_REL_SOFT
);
1372 list_add(&x
->km
.all
, &net
->xfrm
.state_all
);
1373 hlist_add_head_rcu(&x
->bydst
, net
->xfrm
.state_bydst
+ h
);
1374 h
= xfrm_src_hash(net
, daddr
, saddr
, family
);
1375 hlist_add_head_rcu(&x
->bysrc
, net
->xfrm
.state_bysrc
+ h
);
1377 net
->xfrm
.state_num
++;
1379 xfrm_hash_grow_check(net
, x
->bydst
.next
!= NULL
);
/*
 * Forward declaration: used by xfrm_state_add() to find a larval state by
 * key-manager sequence number; its definition is outside this view.
 */
1385 static struct xfrm_state
*__xfrm_find_acq_byseq(struct net
*net
, u32 mark
, u32 seq
);
/*
 * Add a new state, replacing the larval (ACQ) state it resolves, if any.
 *
 * Under xfrm_state_lock:
 *  - __xfrm_state_locate() checks for an already-installed equivalent of
 *    x (by SPI when the protocol is an IPsec one, else by address);
 *  - when SPIs are in use and x carries a key-manager sequence number, a
 *    larval state is looked up by that sequence and is rejected if its
 *    proto or destination address differs from x;
 *  - a larval state is also looked up with __find_acq_core() with a last
 *    argument of 0;
 *  - x is then inserted via __xfrm_state_bump_genids() and
 *    __xfrm_state_insert().
 * After unlocking, the larval state x1 is deleted and a deferred
 * reference (to_put) is dropped.
 * NOTE(review): the error returned when an equivalent state exists, the
 * conditions guarding each step, the reference drops and the return
 * value are not visible in this view.
 */
1387 int xfrm_state_add(struct xfrm_state
*x
)
1389 struct net
*net
= xs_net(x
);
1390 struct xfrm_state
*x1
, *to_put
;
1393 u32 mark
= x
->mark
.v
& x
->mark
.m
;
1394 int use_spi
= xfrm_id_proto_match(x
->id
.proto
, IPSEC_PROTO_ANY
);
1396 family
= x
->props
.family
;
1400 spin_lock_bh(&net
->xfrm
.xfrm_state_lock
);
1402 x1
= __xfrm_state_locate(x
, use_spi
, family
);
1410 if (use_spi
&& x
->km
.seq
) {
1411 x1
= __xfrm_find_acq_byseq(net
, mark
, x
->km
.seq
);
1412 if (x1
&& ((x1
->id
.proto
!= x
->id
.proto
) ||
1413 !xfrm_addr_equal(&x1
->id
.daddr
, &x
->id
.daddr
, family
))) {
1420 x1
= __find_acq_core(net
, &x
->mark
, family
, x
->props
.mode
,
1421 x
->props
.reqid
, x
->if_id
, x
->id
.proto
,
1422 &x
->id
.daddr
, &x
->props
.saddr
, 0);
1424 __xfrm_state_bump_genids(x
);
1425 __xfrm_state_insert(x
);
1429 spin_unlock_bh(&net
->xfrm
.xfrm_state_lock
);
1432 xfrm_state_delete(x1
);
1437 xfrm_state_put(to_put
);
1441 EXPORT_SYMBOL(xfrm_state_add
);
1443 #ifdef CONFIG_XFRM_MIGRATE
1444 static struct xfrm_state
*xfrm_state_clone(struct xfrm_state
*orig
,
1445 struct xfrm_encap_tmpl
*encap
)
1447 struct net
*net
= xs_net(orig
);
1448 struct xfrm_state
*x
= xfrm_state_alloc(net
);
1452 memcpy(&x
->id
, &orig
->id
, sizeof(x
->id
));
1453 memcpy(&x
->sel
, &orig
->sel
, sizeof(x
->sel
));
1454 memcpy(&x
->lft
, &orig
->lft
, sizeof(x
->lft
));
1455 x
->props
.mode
= orig
->props
.mode
;
1456 x
->props
.replay_window
= orig
->props
.replay_window
;
1457 x
->props
.reqid
= orig
->props
.reqid
;
1458 x
->props
.family
= orig
->props
.family
;
1459 x
->props
.saddr
= orig
->props
.saddr
;
1462 x
->aalg
= xfrm_algo_auth_clone(orig
->aalg
);
1466 x
->props
.aalgo
= orig
->props
.aalgo
;
1469 x
->aead
= xfrm_algo_aead_clone(orig
->aead
);
1470 x
->geniv
= orig
->geniv
;
1475 x
->ealg
= xfrm_algo_clone(orig
->ealg
);
1479 x
->props
.ealgo
= orig
->props
.ealgo
;
1482 x
->calg
= xfrm_algo_clone(orig
->calg
);
1486 x
->props
.calgo
= orig
->props
.calgo
;
1488 if (encap
|| orig
->encap
) {
1490 x
->encap
= kmemdup(encap
, sizeof(*x
->encap
),
1493 x
->encap
= kmemdup(orig
->encap
, sizeof(*x
->encap
),
1501 x
->coaddr
= kmemdup(orig
->coaddr
, sizeof(*x
->coaddr
),
1507 if (orig
->replay_esn
) {
1508 if (xfrm_replay_clone(x
, orig
))
1512 memcpy(&x
->mark
, &orig
->mark
, sizeof(x
->mark
));
1514 if (xfrm_init_state(x
) < 0)
1517 x
->props
.flags
= orig
->props
.flags
;
1518 x
->props
.extra_flags
= orig
->props
.extra_flags
;
1520 x
->if_id
= orig
->if_id
;
1521 x
->tfcpad
= orig
->tfcpad
;
1522 x
->replay_maxdiff
= orig
->replay_maxdiff
;
1523 x
->replay_maxage
= orig
->replay_maxage
;
1524 x
->curlft
.add_time
= orig
->curlft
.add_time
;
1525 x
->km
.state
= orig
->km
.state
;
1526 x
->km
.seq
= orig
->km
.seq
;
1527 x
->replay
= orig
->replay
;
1528 x
->preplay
= orig
->preplay
;
1538 struct xfrm_state
*xfrm_migrate_state_find(struct xfrm_migrate
*m
, struct net
*net
)
1541 struct xfrm_state
*x
= NULL
;
1543 spin_lock_bh(&net
->xfrm
.xfrm_state_lock
);
1546 h
= xfrm_dst_hash(net
, &m
->old_daddr
, &m
->old_saddr
,
1547 m
->reqid
, m
->old_family
);
1548 hlist_for_each_entry(x
, net
->xfrm
.state_bydst
+h
, bydst
) {
1549 if (x
->props
.mode
!= m
->mode
||
1550 x
->id
.proto
!= m
->proto
)
1552 if (m
->reqid
&& x
->props
.reqid
!= m
->reqid
)
1554 if (!xfrm_addr_equal(&x
->id
.daddr
, &m
->old_daddr
,
1556 !xfrm_addr_equal(&x
->props
.saddr
, &m
->old_saddr
,
1563 h
= xfrm_src_hash(net
, &m
->old_daddr
, &m
->old_saddr
,
1565 hlist_for_each_entry(x
, net
->xfrm
.state_bysrc
+h
, bysrc
) {
1566 if (x
->props
.mode
!= m
->mode
||
1567 x
->id
.proto
!= m
->proto
)
1569 if (!xfrm_addr_equal(&x
->id
.daddr
, &m
->old_daddr
,
1571 !xfrm_addr_equal(&x
->props
.saddr
, &m
->old_saddr
,
1579 spin_unlock_bh(&net
->xfrm
.xfrm_state_lock
);
1583 EXPORT_SYMBOL(xfrm_migrate_state_find
);
1585 struct xfrm_state
*xfrm_state_migrate(struct xfrm_state
*x
,
1586 struct xfrm_migrate
*m
,
1587 struct xfrm_encap_tmpl
*encap
)
1589 struct xfrm_state
*xc
;
1591 xc
= xfrm_state_clone(x
, encap
);
1595 memcpy(&xc
->id
.daddr
, &m
->new_daddr
, sizeof(xc
->id
.daddr
));
1596 memcpy(&xc
->props
.saddr
, &m
->new_saddr
, sizeof(xc
->props
.saddr
));
1599 if (xfrm_addr_equal(&x
->id
.daddr
, &m
->new_daddr
, m
->new_family
)) {
1600 /* a care is needed when the destination address of the
1601 state is to be updated as it is a part of triplet */
1602 xfrm_state_insert(xc
);
1604 if (xfrm_state_add(xc
) < 0)
1613 EXPORT_SYMBOL(xfrm_state_migrate
);
1616 int xfrm_state_update(struct xfrm_state
*x
)
1618 struct xfrm_state
*x1
, *to_put
;
1620 int use_spi
= xfrm_id_proto_match(x
->id
.proto
, IPSEC_PROTO_ANY
);
1621 struct net
*net
= xs_net(x
);
1625 spin_lock_bh(&net
->xfrm
.xfrm_state_lock
);
1626 x1
= __xfrm_state_locate(x
, use_spi
, x
->props
.family
);
1632 if (xfrm_state_kern(x1
)) {
1638 if (x1
->km
.state
== XFRM_STATE_ACQ
) {
1639 __xfrm_state_insert(x
);
1645 spin_unlock_bh(&net
->xfrm
.xfrm_state_lock
);
1648 xfrm_state_put(to_put
);
1654 xfrm_state_delete(x1
);
1660 spin_lock_bh(&x1
->lock
);
1661 if (likely(x1
->km
.state
== XFRM_STATE_VALID
)) {
1662 if (x
->encap
&& x1
->encap
&&
1663 x
->encap
->encap_type
== x1
->encap
->encap_type
)
1664 memcpy(x1
->encap
, x
->encap
, sizeof(*x1
->encap
));
1665 else if (x
->encap
|| x1
->encap
)
1668 if (x
->coaddr
&& x1
->coaddr
) {
1669 memcpy(x1
->coaddr
, x
->coaddr
, sizeof(*x1
->coaddr
));
1671 if (!use_spi
&& memcmp(&x1
->sel
, &x
->sel
, sizeof(x1
->sel
)))
1672 memcpy(&x1
->sel
, &x
->sel
, sizeof(x1
->sel
));
1673 memcpy(&x1
->lft
, &x
->lft
, sizeof(x1
->lft
));
1676 hrtimer_start(&x1
->mtimer
, ktime_set(1, 0),
1677 HRTIMER_MODE_REL_SOFT
);
1678 if (x1
->curlft
.use_time
)
1679 xfrm_state_check_expire(x1
);
1681 if (x
->props
.smark
.m
|| x
->props
.smark
.v
|| x
->if_id
) {
1682 spin_lock_bh(&net
->xfrm
.xfrm_state_lock
);
1684 if (x
->props
.smark
.m
|| x
->props
.smark
.v
)
1685 x1
->props
.smark
= x
->props
.smark
;
1688 x1
->if_id
= x
->if_id
;
1690 __xfrm_state_bump_genids(x1
);
1691 spin_unlock_bh(&net
->xfrm
.xfrm_state_lock
);
1695 x
->km
.state
= XFRM_STATE_DEAD
;
1696 __xfrm_state_put(x
);
1700 spin_unlock_bh(&x1
->lock
);
1706 EXPORT_SYMBOL(xfrm_state_update
);
1708 int xfrm_state_check_expire(struct xfrm_state
*x
)
1710 if (!x
->curlft
.use_time
)
1711 x
->curlft
.use_time
= ktime_get_real_seconds();
1713 if (x
->curlft
.bytes
>= x
->lft
.hard_byte_limit
||
1714 x
->curlft
.packets
>= x
->lft
.hard_packet_limit
) {
1715 x
->km
.state
= XFRM_STATE_EXPIRED
;
1716 hrtimer_start(&x
->mtimer
, 0, HRTIMER_MODE_REL_SOFT
);
1721 (x
->curlft
.bytes
>= x
->lft
.soft_byte_limit
||
1722 x
->curlft
.packets
>= x
->lft
.soft_packet_limit
)) {
1724 km_state_expired(x
, 0, 0);
1728 EXPORT_SYMBOL(xfrm_state_check_expire
);
1731 xfrm_state_lookup(struct net
*net
, u32 mark
, const xfrm_address_t
*daddr
, __be32 spi
,
1732 u8 proto
, unsigned short family
)
1734 struct xfrm_state
*x
;
1737 x
= __xfrm_state_lookup(net
, mark
, daddr
, spi
, proto
, family
);
1741 EXPORT_SYMBOL(xfrm_state_lookup
);
1744 xfrm_state_lookup_byaddr(struct net
*net
, u32 mark
,
1745 const xfrm_address_t
*daddr
, const xfrm_address_t
*saddr
,
1746 u8 proto
, unsigned short family
)
1748 struct xfrm_state
*x
;
1750 spin_lock_bh(&net
->xfrm
.xfrm_state_lock
);
1751 x
= __xfrm_state_lookup_byaddr(net
, mark
, daddr
, saddr
, proto
, family
);
1752 spin_unlock_bh(&net
->xfrm
.xfrm_state_lock
);
1755 EXPORT_SYMBOL(xfrm_state_lookup_byaddr
);
1758 xfrm_find_acq(struct net
*net
, const struct xfrm_mark
*mark
, u8 mode
, u32 reqid
,
1759 u32 if_id
, u8 proto
, const xfrm_address_t
*daddr
,
1760 const xfrm_address_t
*saddr
, int create
, unsigned short family
)
1762 struct xfrm_state
*x
;
1764 spin_lock_bh(&net
->xfrm
.xfrm_state_lock
);
1765 x
= __find_acq_core(net
, mark
, family
, mode
, reqid
, if_id
, proto
, daddr
, saddr
, create
);
1766 spin_unlock_bh(&net
->xfrm
.xfrm_state_lock
);
1770 EXPORT_SYMBOL(xfrm_find_acq
);
1772 #ifdef CONFIG_XFRM_SUB_POLICY
1773 #if IS_ENABLED(CONFIG_IPV6)
1774 /* distribution counting sort function for xfrm_state and xfrm_tmpl */
1776 __xfrm6_sort(void **dst
, void **src
, int n
,
1777 int (*cmp
)(const void *p
), int maxclass
)
1779 int count
[XFRM_MAX_DEPTH
] = { };
1780 int class[XFRM_MAX_DEPTH
];
1783 for (i
= 0; i
< n
; i
++) {
1784 int c
= cmp(src
[i
]);
1790 for (i
= 2; i
< maxclass
; i
++)
1791 count
[i
] += count
[i
- 1];
1793 for (i
= 0; i
< n
; i
++) {
1794 dst
[count
[class[i
] - 1]++] = src
[i
];
1799 /* Rule for xfrm_state:
1801 * rule 1: select IPsec transport except AH
1802 * rule 2: select MIPv6 RO or inbound trigger
1803 * rule 3: select IPsec transport AH
1804 * rule 4: select IPsec tunnel
1807 static int __xfrm6_state_sort_cmp(const void *p
)
1809 const struct xfrm_state
*v
= p
;
1811 switch (v
->props
.mode
) {
1812 case XFRM_MODE_TRANSPORT
:
1813 if (v
->id
.proto
!= IPPROTO_AH
)
1817 #if IS_ENABLED(CONFIG_IPV6_MIP6)
1818 case XFRM_MODE_ROUTEOPTIMIZATION
:
1819 case XFRM_MODE_IN_TRIGGER
:
1822 case XFRM_MODE_TUNNEL
:
1823 case XFRM_MODE_BEET
:
1829 /* Rule for xfrm_tmpl:
1831 * rule 1: select IPsec transport
1832 * rule 2: select MIPv6 RO or inbound trigger
1833 * rule 3: select IPsec tunnel
1836 static int __xfrm6_tmpl_sort_cmp(const void *p
)
1838 const struct xfrm_tmpl
*v
= p
;
1841 case XFRM_MODE_TRANSPORT
:
1843 #if IS_ENABLED(CONFIG_IPV6_MIP6)
1844 case XFRM_MODE_ROUTEOPTIMIZATION
:
1845 case XFRM_MODE_IN_TRIGGER
:
1848 case XFRM_MODE_TUNNEL
:
1849 case XFRM_MODE_BEET
:
1855 static inline int __xfrm6_state_sort_cmp(const void *p
) { return 5; }
1856 static inline int __xfrm6_tmpl_sort_cmp(const void *p
) { return 4; }
1859 __xfrm6_sort(void **dst
, void **src
, int n
,
1860 int (*cmp
)(const void *p
), int maxclass
)
1864 for (i
= 0; i
< n
; i
++)
1867 #endif /* CONFIG_IPV6 */
1870 xfrm_tmpl_sort(struct xfrm_tmpl
**dst
, struct xfrm_tmpl
**src
, int n
,
1871 unsigned short family
)
1875 if (family
== AF_INET6
)
1876 __xfrm6_sort((void **)dst
, (void **)src
, n
,
1877 __xfrm6_tmpl_sort_cmp
, 5);
1879 for (i
= 0; i
< n
; i
++)
1884 xfrm_state_sort(struct xfrm_state
**dst
, struct xfrm_state
**src
, int n
,
1885 unsigned short family
)
1889 if (family
== AF_INET6
)
1890 __xfrm6_sort((void **)dst
, (void **)src
, n
,
1891 __xfrm6_state_sort_cmp
, 6);
1893 for (i
= 0; i
< n
; i
++)
1898 /* Silly enough, but I'm lazy to build resolution list */
1900 static struct xfrm_state
*__xfrm_find_acq_byseq(struct net
*net
, u32 mark
, u32 seq
)
1904 for (i
= 0; i
<= net
->xfrm
.state_hmask
; i
++) {
1905 struct xfrm_state
*x
;
1907 hlist_for_each_entry(x
, net
->xfrm
.state_bydst
+i
, bydst
) {
1908 if (x
->km
.seq
== seq
&&
1909 (mark
& x
->mark
.m
) == x
->mark
.v
&&
1910 x
->km
.state
== XFRM_STATE_ACQ
) {
1919 struct xfrm_state
*xfrm_find_acq_byseq(struct net
*net
, u32 mark
, u32 seq
)
1921 struct xfrm_state
*x
;
1923 spin_lock_bh(&net
->xfrm
.xfrm_state_lock
);
1924 x
= __xfrm_find_acq_byseq(net
, mark
, seq
);
1925 spin_unlock_bh(&net
->xfrm
.xfrm_state_lock
);
1928 EXPORT_SYMBOL(xfrm_find_acq_byseq
);
1930 u32
xfrm_get_acqseq(void)
1933 static atomic_t acqseq
;
1936 res
= atomic_inc_return(&acqseq
);
1941 EXPORT_SYMBOL(xfrm_get_acqseq
);
1943 int verify_spi_info(u8 proto
, u32 min
, u32 max
)
1951 /* IPCOMP spi is 16-bits. */
1965 EXPORT_SYMBOL(verify_spi_info
);
1967 int xfrm_alloc_spi(struct xfrm_state
*x
, u32 low
, u32 high
)
1969 struct net
*net
= xs_net(x
);
1971 struct xfrm_state
*x0
;
1973 __be32 minspi
= htonl(low
);
1974 __be32 maxspi
= htonl(high
);
1975 u32 mark
= x
->mark
.v
& x
->mark
.m
;
1977 spin_lock_bh(&x
->lock
);
1978 if (x
->km
.state
== XFRM_STATE_DEAD
)
1987 if (minspi
== maxspi
) {
1988 x0
= xfrm_state_lookup(net
, mark
, &x
->id
.daddr
, minspi
, x
->id
.proto
, x
->props
.family
);
1996 for (h
= 0; h
< high
-low
+1; h
++) {
1997 spi
= low
+ prandom_u32()%(high
-low
+1);
1998 x0
= xfrm_state_lookup(net
, mark
, &x
->id
.daddr
, htonl(spi
), x
->id
.proto
, x
->props
.family
);
2000 x
->id
.spi
= htonl(spi
);
2007 spin_lock_bh(&net
->xfrm
.xfrm_state_lock
);
2008 h
= xfrm_spi_hash(net
, &x
->id
.daddr
, x
->id
.spi
, x
->id
.proto
, x
->props
.family
);
2009 hlist_add_head_rcu(&x
->byspi
, net
->xfrm
.state_byspi
+ h
);
2010 spin_unlock_bh(&net
->xfrm
.xfrm_state_lock
);
2016 spin_unlock_bh(&x
->lock
);
2020 EXPORT_SYMBOL(xfrm_alloc_spi
);
2022 static bool __xfrm_state_filter_match(struct xfrm_state
*x
,
2023 struct xfrm_address_filter
*filter
)
2026 if ((filter
->family
== AF_INET
||
2027 filter
->family
== AF_INET6
) &&
2028 x
->props
.family
!= filter
->family
)
2031 return addr_match(&x
->props
.saddr
, &filter
->saddr
,
2033 addr_match(&x
->id
.daddr
, &filter
->daddr
,
2039 int xfrm_state_walk(struct net
*net
, struct xfrm_state_walk
*walk
,
2040 int (*func
)(struct xfrm_state
*, int, void*),
2043 struct xfrm_state
*state
;
2044 struct xfrm_state_walk
*x
;
2047 if (walk
->seq
!= 0 && list_empty(&walk
->all
))
2050 spin_lock_bh(&net
->xfrm
.xfrm_state_lock
);
2051 if (list_empty(&walk
->all
))
2052 x
= list_first_entry(&net
->xfrm
.state_all
, struct xfrm_state_walk
, all
);
2054 x
= list_first_entry(&walk
->all
, struct xfrm_state_walk
, all
);
2055 list_for_each_entry_from(x
, &net
->xfrm
.state_all
, all
) {
2056 if (x
->state
== XFRM_STATE_DEAD
)
2058 state
= container_of(x
, struct xfrm_state
, km
);
2059 if (!xfrm_id_proto_match(state
->id
.proto
, walk
->proto
))
2061 if (!__xfrm_state_filter_match(state
, walk
->filter
))
2063 err
= func(state
, walk
->seq
, data
);
2065 list_move_tail(&walk
->all
, &x
->all
);
2070 if (walk
->seq
== 0) {
2074 list_del_init(&walk
->all
);
2076 spin_unlock_bh(&net
->xfrm
.xfrm_state_lock
);
2079 EXPORT_SYMBOL(xfrm_state_walk
);
2081 void xfrm_state_walk_init(struct xfrm_state_walk
*walk
, u8 proto
,
2082 struct xfrm_address_filter
*filter
)
2084 INIT_LIST_HEAD(&walk
->all
);
2085 walk
->proto
= proto
;
2086 walk
->state
= XFRM_STATE_DEAD
;
2088 walk
->filter
= filter
;
2090 EXPORT_SYMBOL(xfrm_state_walk_init
);
2092 void xfrm_state_walk_done(struct xfrm_state_walk
*walk
, struct net
*net
)
2094 kfree(walk
->filter
);
2096 if (list_empty(&walk
->all
))
2099 spin_lock_bh(&net
->xfrm
.xfrm_state_lock
);
2100 list_del(&walk
->all
);
2101 spin_unlock_bh(&net
->xfrm
.xfrm_state_lock
);
2103 EXPORT_SYMBOL(xfrm_state_walk_done
);
2105 static void xfrm_replay_timer_handler(struct timer_list
*t
)
2107 struct xfrm_state
*x
= from_timer(x
, t
, rtimer
);
2109 spin_lock(&x
->lock
);
2111 if (x
->km
.state
== XFRM_STATE_VALID
) {
2112 if (xfrm_aevent_is_on(xs_net(x
)))
2113 x
->repl
->notify(x
, XFRM_REPLAY_TIMEOUT
);
2115 x
->xflags
|= XFRM_TIME_DEFER
;
2118 spin_unlock(&x
->lock
);
2121 static LIST_HEAD(xfrm_km_list
);
2123 void km_policy_notify(struct xfrm_policy
*xp
, int dir
, const struct km_event
*c
)
2125 struct xfrm_mgr
*km
;
2128 list_for_each_entry_rcu(km
, &xfrm_km_list
, list
)
2129 if (km
->notify_policy
)
2130 km
->notify_policy(xp
, dir
, c
);
2134 void km_state_notify(struct xfrm_state
*x
, const struct km_event
*c
)
2136 struct xfrm_mgr
*km
;
2138 list_for_each_entry_rcu(km
, &xfrm_km_list
, list
)
2144 EXPORT_SYMBOL(km_policy_notify
);
2145 EXPORT_SYMBOL(km_state_notify
);
2147 void km_state_expired(struct xfrm_state
*x
, int hard
, u32 portid
)
2153 c
.event
= XFRM_MSG_EXPIRE
;
2154 km_state_notify(x
, &c
);
2157 EXPORT_SYMBOL(km_state_expired
);
2159 * We send to all registered managers regardless of failure
2160 * We are happy with one success
2162 int km_query(struct xfrm_state
*x
, struct xfrm_tmpl
*t
, struct xfrm_policy
*pol
)
2164 int err
= -EINVAL
, acqret
;
2165 struct xfrm_mgr
*km
;
2168 list_for_each_entry_rcu(km
, &xfrm_km_list
, list
) {
2169 acqret
= km
->acquire(x
, t
, pol
);
2176 EXPORT_SYMBOL(km_query
);
2178 int km_new_mapping(struct xfrm_state
*x
, xfrm_address_t
*ipaddr
, __be16 sport
)
2181 struct xfrm_mgr
*km
;
2184 list_for_each_entry_rcu(km
, &xfrm_km_list
, list
) {
2185 if (km
->new_mapping
)
2186 err
= km
->new_mapping(x
, ipaddr
, sport
);
2193 EXPORT_SYMBOL(km_new_mapping
);
2195 void km_policy_expired(struct xfrm_policy
*pol
, int dir
, int hard
, u32 portid
)
2201 c
.event
= XFRM_MSG_POLEXPIRE
;
2202 km_policy_notify(pol
, dir
, &c
);
2204 EXPORT_SYMBOL(km_policy_expired
);
2206 #ifdef CONFIG_XFRM_MIGRATE
2207 int km_migrate(const struct xfrm_selector
*sel
, u8 dir
, u8 type
,
2208 const struct xfrm_migrate
*m
, int num_migrate
,
2209 const struct xfrm_kmaddress
*k
,
2210 const struct xfrm_encap_tmpl
*encap
)
2214 struct xfrm_mgr
*km
;
2217 list_for_each_entry_rcu(km
, &xfrm_km_list
, list
) {
2219 ret
= km
->migrate(sel
, dir
, type
, m
, num_migrate
, k
,
2228 EXPORT_SYMBOL(km_migrate
);
2231 int km_report(struct net
*net
, u8 proto
, struct xfrm_selector
*sel
, xfrm_address_t
*addr
)
2235 struct xfrm_mgr
*km
;
2238 list_for_each_entry_rcu(km
, &xfrm_km_list
, list
) {
2240 ret
= km
->report(net
, proto
, sel
, addr
);
2248 EXPORT_SYMBOL(km_report
);
2250 static bool km_is_alive(const struct km_event
*c
)
2252 struct xfrm_mgr
*km
;
2253 bool is_alive
= false;
2256 list_for_each_entry_rcu(km
, &xfrm_km_list
, list
) {
2257 if (km
->is_alive
&& km
->is_alive(c
)) {
2267 int xfrm_user_policy(struct sock
*sk
, int optname
, u8 __user
*optval
, int optlen
)
2271 struct xfrm_mgr
*km
;
2272 struct xfrm_policy
*pol
= NULL
;
2274 if (in_compat_syscall())
2277 if (!optval
&& !optlen
) {
2278 xfrm_sk_policy_insert(sk
, XFRM_POLICY_IN
, NULL
);
2279 xfrm_sk_policy_insert(sk
, XFRM_POLICY_OUT
, NULL
);
2284 if (optlen
<= 0 || optlen
> PAGE_SIZE
)
2287 data
= memdup_user(optval
, optlen
);
2289 return PTR_ERR(data
);
2293 list_for_each_entry_rcu(km
, &xfrm_km_list
, list
) {
2294 pol
= km
->compile_policy(sk
, optname
, data
,
2302 xfrm_sk_policy_insert(sk
, err
, pol
);
2311 EXPORT_SYMBOL(xfrm_user_policy
);
2313 static DEFINE_SPINLOCK(xfrm_km_lock
);
2315 int xfrm_register_km(struct xfrm_mgr
*km
)
2317 spin_lock_bh(&xfrm_km_lock
);
2318 list_add_tail_rcu(&km
->list
, &xfrm_km_list
);
2319 spin_unlock_bh(&xfrm_km_lock
);
2322 EXPORT_SYMBOL(xfrm_register_km
);
2324 int xfrm_unregister_km(struct xfrm_mgr
*km
)
2326 spin_lock_bh(&xfrm_km_lock
);
2327 list_del_rcu(&km
->list
);
2328 spin_unlock_bh(&xfrm_km_lock
);
2332 EXPORT_SYMBOL(xfrm_unregister_km
);
2334 int xfrm_state_register_afinfo(struct xfrm_state_afinfo
*afinfo
)
2338 if (WARN_ON(afinfo
->family
>= NPROTO
))
2339 return -EAFNOSUPPORT
;
2341 spin_lock_bh(&xfrm_state_afinfo_lock
);
2342 if (unlikely(xfrm_state_afinfo
[afinfo
->family
] != NULL
))
2345 rcu_assign_pointer(xfrm_state_afinfo
[afinfo
->family
], afinfo
);
2346 spin_unlock_bh(&xfrm_state_afinfo_lock
);
2349 EXPORT_SYMBOL(xfrm_state_register_afinfo
);
2351 int xfrm_state_unregister_afinfo(struct xfrm_state_afinfo
*afinfo
)
2353 int err
= 0, family
= afinfo
->family
;
2355 if (WARN_ON(family
>= NPROTO
))
2356 return -EAFNOSUPPORT
;
2358 spin_lock_bh(&xfrm_state_afinfo_lock
);
2359 if (likely(xfrm_state_afinfo
[afinfo
->family
] != NULL
)) {
2360 if (rcu_access_pointer(xfrm_state_afinfo
[family
]) != afinfo
)
2363 RCU_INIT_POINTER(xfrm_state_afinfo
[afinfo
->family
], NULL
);
2365 spin_unlock_bh(&xfrm_state_afinfo_lock
);
2369 EXPORT_SYMBOL(xfrm_state_unregister_afinfo
);
2371 struct xfrm_state_afinfo
*xfrm_state_afinfo_get_rcu(unsigned int family
)
2373 if (unlikely(family
>= NPROTO
))
2376 return rcu_dereference(xfrm_state_afinfo
[family
]);
2378 EXPORT_SYMBOL_GPL(xfrm_state_afinfo_get_rcu
);
2380 struct xfrm_state_afinfo
*xfrm_state_get_afinfo(unsigned int family
)
2382 struct xfrm_state_afinfo
*afinfo
;
2383 if (unlikely(family
>= NPROTO
))
2386 afinfo
= rcu_dereference(xfrm_state_afinfo
[family
]);
2387 if (unlikely(!afinfo
))
2392 void xfrm_flush_gc(void)
2394 flush_work(&xfrm_state_gc_work
);
2396 EXPORT_SYMBOL(xfrm_flush_gc
);
2398 /* Temporarily located here until net/xfrm/xfrm_tunnel.c is created */
2399 void xfrm_state_delete_tunnel(struct xfrm_state
*x
)
2402 struct xfrm_state
*t
= x
->tunnel
;
2404 if (atomic_read(&t
->tunnel_users
) == 2)
2405 xfrm_state_delete(t
);
2406 atomic_dec(&t
->tunnel_users
);
2407 xfrm_state_put_sync(t
);
2411 EXPORT_SYMBOL(xfrm_state_delete_tunnel
);
2413 u32
xfrm_state_mtu(struct xfrm_state
*x
, int mtu
)
2415 const struct xfrm_type
*type
= READ_ONCE(x
->type
);
2416 struct crypto_aead
*aead
;
2417 u32 blksize
, net_adj
= 0;
2419 if (x
->km
.state
!= XFRM_STATE_VALID
||
2420 !type
|| type
->proto
!= IPPROTO_ESP
)
2421 return mtu
- x
->props
.header_len
;
2424 blksize
= ALIGN(crypto_aead_blocksize(aead
), 4);
2426 switch (x
->props
.mode
) {
2427 case XFRM_MODE_TRANSPORT
:
2428 case XFRM_MODE_BEET
:
2429 if (x
->props
.family
== AF_INET
)
2430 net_adj
= sizeof(struct iphdr
);
2431 else if (x
->props
.family
== AF_INET6
)
2432 net_adj
= sizeof(struct ipv6hdr
);
2434 case XFRM_MODE_TUNNEL
:
2441 return ((mtu
- x
->props
.header_len
- crypto_aead_authsize(aead
) -
2442 net_adj
) & ~(blksize
- 1)) + net_adj
- 2;
2444 EXPORT_SYMBOL_GPL(xfrm_state_mtu
);
2446 int __xfrm_init_state(struct xfrm_state
*x
, bool init_replay
, bool offload
)
2448 const struct xfrm_mode
*inner_mode
;
2449 const struct xfrm_mode
*outer_mode
;
2450 int family
= x
->props
.family
;
2453 if (family
== AF_INET
&&
2454 xs_net(x
)->ipv4
.sysctl_ip_no_pmtu_disc
)
2455 x
->props
.flags
|= XFRM_STATE_NOPMTUDISC
;
2457 err
= -EPROTONOSUPPORT
;
2459 if (x
->sel
.family
!= AF_UNSPEC
) {
2460 inner_mode
= xfrm_get_mode(x
->props
.mode
, x
->sel
.family
);
2461 if (inner_mode
== NULL
)
2464 if (!(inner_mode
->flags
& XFRM_MODE_FLAG_TUNNEL
) &&
2465 family
!= x
->sel
.family
)
2468 x
->inner_mode
= *inner_mode
;
2470 const struct xfrm_mode
*inner_mode_iaf
;
2471 int iafamily
= AF_INET
;
2473 inner_mode
= xfrm_get_mode(x
->props
.mode
, x
->props
.family
);
2474 if (inner_mode
== NULL
)
2477 if (!(inner_mode
->flags
& XFRM_MODE_FLAG_TUNNEL
))
2480 x
->inner_mode
= *inner_mode
;
2482 if (x
->props
.family
== AF_INET
)
2483 iafamily
= AF_INET6
;
2485 inner_mode_iaf
= xfrm_get_mode(x
->props
.mode
, iafamily
);
2486 if (inner_mode_iaf
) {
2487 if (inner_mode_iaf
->flags
& XFRM_MODE_FLAG_TUNNEL
)
2488 x
->inner_mode_iaf
= *inner_mode_iaf
;
2492 x
->type
= xfrm_get_type(x
->id
.proto
, family
);
2493 if (x
->type
== NULL
)
2496 x
->type_offload
= xfrm_get_type_offload(x
->id
.proto
, family
, offload
);
2498 err
= x
->type
->init_state(x
);
2502 outer_mode
= xfrm_get_mode(x
->props
.mode
, family
);
2504 err
= -EPROTONOSUPPORT
;
2508 x
->outer_mode
= *outer_mode
;
2510 err
= xfrm_init_replay(x
);
2519 EXPORT_SYMBOL(__xfrm_init_state
);
2521 int xfrm_init_state(struct xfrm_state
*x
)
2525 err
= __xfrm_init_state(x
, true, false);
2527 x
->km
.state
= XFRM_STATE_VALID
;
2532 EXPORT_SYMBOL(xfrm_init_state
);
2534 int __net_init
xfrm_state_init(struct net
*net
)
2538 if (net_eq(net
, &init_net
))
2539 xfrm_state_cache
= KMEM_CACHE(xfrm_state
,
2540 SLAB_HWCACHE_ALIGN
| SLAB_PANIC
);
2542 INIT_LIST_HEAD(&net
->xfrm
.state_all
);
2544 sz
= sizeof(struct hlist_head
) * 8;
2546 net
->xfrm
.state_bydst
= xfrm_hash_alloc(sz
);
2547 if (!net
->xfrm
.state_bydst
)
2549 net
->xfrm
.state_bysrc
= xfrm_hash_alloc(sz
);
2550 if (!net
->xfrm
.state_bysrc
)
2552 net
->xfrm
.state_byspi
= xfrm_hash_alloc(sz
);
2553 if (!net
->xfrm
.state_byspi
)
2555 net
->xfrm
.state_hmask
= ((sz
/ sizeof(struct hlist_head
)) - 1);
2557 net
->xfrm
.state_num
= 0;
2558 INIT_WORK(&net
->xfrm
.state_hash_work
, xfrm_hash_resize
);
2559 spin_lock_init(&net
->xfrm
.xfrm_state_lock
);
2563 xfrm_hash_free(net
->xfrm
.state_bysrc
, sz
);
2565 xfrm_hash_free(net
->xfrm
.state_bydst
, sz
);
2570 void xfrm_state_fini(struct net
*net
)
2574 flush_work(&net
->xfrm
.state_hash_work
);
2575 flush_work(&xfrm_state_gc_work
);
2576 xfrm_state_flush(net
, 0, false, true);
2578 WARN_ON(!list_empty(&net
->xfrm
.state_all
));
2580 sz
= (net
->xfrm
.state_hmask
+ 1) * sizeof(struct hlist_head
);
2581 WARN_ON(!hlist_empty(net
->xfrm
.state_byspi
));
2582 xfrm_hash_free(net
->xfrm
.state_byspi
, sz
);
2583 WARN_ON(!hlist_empty(net
->xfrm
.state_bysrc
));
2584 xfrm_hash_free(net
->xfrm
.state_bysrc
, sz
);
2585 WARN_ON(!hlist_empty(net
->xfrm
.state_bydst
));
2586 xfrm_hash_free(net
->xfrm
.state_bydst
, sz
);
2589 #ifdef CONFIG_AUDITSYSCALL
2590 static void xfrm_audit_helper_sainfo(struct xfrm_state
*x
,
2591 struct audit_buffer
*audit_buf
)
2593 struct xfrm_sec_ctx
*ctx
= x
->security
;
2594 u32 spi
= ntohl(x
->id
.spi
);
2597 audit_log_format(audit_buf
, " sec_alg=%u sec_doi=%u sec_obj=%s",
2598 ctx
->ctx_alg
, ctx
->ctx_doi
, ctx
->ctx_str
);
2600 switch (x
->props
.family
) {
2602 audit_log_format(audit_buf
, " src=%pI4 dst=%pI4",
2603 &x
->props
.saddr
.a4
, &x
->id
.daddr
.a4
);
2606 audit_log_format(audit_buf
, " src=%pI6 dst=%pI6",
2607 x
->props
.saddr
.a6
, x
->id
.daddr
.a6
);
2611 audit_log_format(audit_buf
, " spi=%u(0x%x)", spi
, spi
);
2614 static void xfrm_audit_helper_pktinfo(struct sk_buff
*skb
, u16 family
,
2615 struct audit_buffer
*audit_buf
)
2617 const struct iphdr
*iph4
;
2618 const struct ipv6hdr
*iph6
;
2623 audit_log_format(audit_buf
, " src=%pI4 dst=%pI4",
2624 &iph4
->saddr
, &iph4
->daddr
);
2627 iph6
= ipv6_hdr(skb
);
2628 audit_log_format(audit_buf
,
2629 " src=%pI6 dst=%pI6 flowlbl=0x%x%02x%02x",
2630 &iph6
->saddr
, &iph6
->daddr
,
2631 iph6
->flow_lbl
[0] & 0x0f,
2638 void xfrm_audit_state_add(struct xfrm_state
*x
, int result
, bool task_valid
)
2640 struct audit_buffer
*audit_buf
;
2642 audit_buf
= xfrm_audit_start("SAD-add");
2643 if (audit_buf
== NULL
)
2645 xfrm_audit_helper_usrinfo(task_valid
, audit_buf
);
2646 xfrm_audit_helper_sainfo(x
, audit_buf
);
2647 audit_log_format(audit_buf
, " res=%u", result
);
2648 audit_log_end(audit_buf
);
2650 EXPORT_SYMBOL_GPL(xfrm_audit_state_add
);
2652 void xfrm_audit_state_delete(struct xfrm_state
*x
, int result
, bool task_valid
)
2654 struct audit_buffer
*audit_buf
;
2656 audit_buf
= xfrm_audit_start("SAD-delete");
2657 if (audit_buf
== NULL
)
2659 xfrm_audit_helper_usrinfo(task_valid
, audit_buf
);
2660 xfrm_audit_helper_sainfo(x
, audit_buf
);
2661 audit_log_format(audit_buf
, " res=%u", result
);
2662 audit_log_end(audit_buf
);
2664 EXPORT_SYMBOL_GPL(xfrm_audit_state_delete
);
2666 void xfrm_audit_state_replay_overflow(struct xfrm_state
*x
,
2667 struct sk_buff
*skb
)
2669 struct audit_buffer
*audit_buf
;
2672 audit_buf
= xfrm_audit_start("SA-replay-overflow");
2673 if (audit_buf
== NULL
)
2675 xfrm_audit_helper_pktinfo(skb
, x
->props
.family
, audit_buf
);
2676 /* don't record the sequence number because it's inherent in this kind
2677 * of audit message */
2678 spi
= ntohl(x
->id
.spi
);
2679 audit_log_format(audit_buf
, " spi=%u(0x%x)", spi
, spi
);
2680 audit_log_end(audit_buf
);
2682 EXPORT_SYMBOL_GPL(xfrm_audit_state_replay_overflow
);
2684 void xfrm_audit_state_replay(struct xfrm_state
*x
,
2685 struct sk_buff
*skb
, __be32 net_seq
)
2687 struct audit_buffer
*audit_buf
;
2690 audit_buf
= xfrm_audit_start("SA-replayed-pkt");
2691 if (audit_buf
== NULL
)
2693 xfrm_audit_helper_pktinfo(skb
, x
->props
.family
, audit_buf
);
2694 spi
= ntohl(x
->id
.spi
);
2695 audit_log_format(audit_buf
, " spi=%u(0x%x) seqno=%u",
2696 spi
, spi
, ntohl(net_seq
));
2697 audit_log_end(audit_buf
);
2699 EXPORT_SYMBOL_GPL(xfrm_audit_state_replay
);
2701 void xfrm_audit_state_notfound_simple(struct sk_buff
*skb
, u16 family
)
2703 struct audit_buffer
*audit_buf
;
2705 audit_buf
= xfrm_audit_start("SA-notfound");
2706 if (audit_buf
== NULL
)
2708 xfrm_audit_helper_pktinfo(skb
, family
, audit_buf
);
2709 audit_log_end(audit_buf
);
2711 EXPORT_SYMBOL_GPL(xfrm_audit_state_notfound_simple
);
2713 void xfrm_audit_state_notfound(struct sk_buff
*skb
, u16 family
,
2714 __be32 net_spi
, __be32 net_seq
)
2716 struct audit_buffer
*audit_buf
;
2719 audit_buf
= xfrm_audit_start("SA-notfound");
2720 if (audit_buf
== NULL
)
2722 xfrm_audit_helper_pktinfo(skb
, family
, audit_buf
);
2723 spi
= ntohl(net_spi
);
2724 audit_log_format(audit_buf
, " spi=%u(0x%x) seqno=%u",
2725 spi
, spi
, ntohl(net_seq
));
2726 audit_log_end(audit_buf
);
2728 EXPORT_SYMBOL_GPL(xfrm_audit_state_notfound
);
2730 void xfrm_audit_state_icvfail(struct xfrm_state
*x
,
2731 struct sk_buff
*skb
, u8 proto
)
2733 struct audit_buffer
*audit_buf
;
2737 audit_buf
= xfrm_audit_start("SA-icv-failure");
2738 if (audit_buf
== NULL
)
2740 xfrm_audit_helper_pktinfo(skb
, x
->props
.family
, audit_buf
);
2741 if (xfrm_parse_spi(skb
, proto
, &net_spi
, &net_seq
) == 0) {
2742 u32 spi
= ntohl(net_spi
);
2743 audit_log_format(audit_buf
, " spi=%u(0x%x) seqno=%u",
2744 spi
, spi
, ntohl(net_seq
));
2746 audit_log_end(audit_buf
);
2748 EXPORT_SYMBOL_GPL(xfrm_audit_state_icvfail
);
2749 #endif /* CONFIG_AUDITSYSCALL */