/*
 * (C) 2012 by Pablo Neira Ayuso <pablo@netfilter.org>
 * (C) 2012 by Vyatta Inc. <http://www.vyatta.com>
 *
 * This program is free software; you can redistribute it and/or modify
 * it under the terms of the GNU General Public License version 2 as
 * published by the Free Software Foundation (or any later at your option).
 */
9 #include <linux/init.h>
10 #include <linux/module.h>
11 #include <linux/kernel.h>
12 #include <linux/rculist.h>
13 #include <linux/rculist_nulls.h>
14 #include <linux/types.h>
15 #include <linux/timer.h>
16 #include <linux/security.h>
17 #include <linux/skbuff.h>
18 #include <linux/errno.h>
19 #include <linux/netlink.h>
20 #include <linux/spinlock.h>
21 #include <linux/interrupt.h>
22 #include <linux/slab.h>
24 #include <linux/netfilter.h>
25 #include <net/netlink.h>
27 #include <net/netfilter/nf_conntrack.h>
28 #include <net/netfilter/nf_conntrack_core.h>
29 #include <net/netfilter/nf_conntrack_l3proto.h>
30 #include <net/netfilter/nf_conntrack_l4proto.h>
31 #include <net/netfilter/nf_conntrack_tuple.h>
32 #include <net/netfilter/nf_conntrack_timeout.h>
34 #include <linux/netfilter/nfnetlink.h>
35 #include <linux/netfilter/nfnetlink_cttimeout.h>
37 MODULE_LICENSE("GPL");
38 MODULE_AUTHOR("Pablo Neira Ayuso <pablo@netfilter.org>");
39 MODULE_DESCRIPTION("cttimeout: Extended Netfilter Connection Tracking timeout tuning");
41 static const struct nla_policy cttimeout_nla_policy
[CTA_TIMEOUT_MAX
+1] = {
42 [CTA_TIMEOUT_NAME
] = { .type
= NLA_NUL_STRING
,
43 .len
= CTNL_TIMEOUT_NAME_MAX
- 1},
44 [CTA_TIMEOUT_L3PROTO
] = { .type
= NLA_U16
},
45 [CTA_TIMEOUT_L4PROTO
] = { .type
= NLA_U8
},
46 [CTA_TIMEOUT_DATA
] = { .type
= NLA_NESTED
},
50 ctnl_timeout_parse_policy(void *timeouts
,
51 const struct nf_conntrack_l4proto
*l4proto
,
52 struct net
*net
, const struct nlattr
*attr
)
56 if (likely(l4proto
->ctnl_timeout
.nlattr_to_obj
)) {
57 struct nlattr
*tb
[l4proto
->ctnl_timeout
.nlattr_max
+1];
59 ret
= nla_parse_nested(tb
, l4proto
->ctnl_timeout
.nlattr_max
,
60 attr
, l4proto
->ctnl_timeout
.nla_policy
,
65 ret
= l4proto
->ctnl_timeout
.nlattr_to_obj(tb
, net
, timeouts
);
70 static int cttimeout_new_timeout(struct net
*net
, struct sock
*ctnl
,
72 const struct nlmsghdr
*nlh
,
73 const struct nlattr
* const cda
[],
74 struct netlink_ext_ack
*extack
)
78 const struct nf_conntrack_l4proto
*l4proto
;
79 struct ctnl_timeout
*timeout
, *matching
= NULL
;
83 if (!cda
[CTA_TIMEOUT_NAME
] ||
84 !cda
[CTA_TIMEOUT_L3PROTO
] ||
85 !cda
[CTA_TIMEOUT_L4PROTO
] ||
86 !cda
[CTA_TIMEOUT_DATA
])
89 name
= nla_data(cda
[CTA_TIMEOUT_NAME
]);
90 l3num
= ntohs(nla_get_be16(cda
[CTA_TIMEOUT_L3PROTO
]));
91 l4num
= nla_get_u8(cda
[CTA_TIMEOUT_L4PROTO
]);
93 list_for_each_entry(timeout
, &net
->nfct_timeout_list
, head
) {
94 if (strncmp(timeout
->name
, name
, CTNL_TIMEOUT_NAME_MAX
) != 0)
97 if (nlh
->nlmsg_flags
& NLM_F_EXCL
)
105 if (nlh
->nlmsg_flags
& NLM_F_REPLACE
) {
106 /* You cannot replace one timeout policy by another of
107 * different kind, sorry.
109 if (matching
->l3num
!= l3num
||
110 matching
->l4proto
->l4proto
!= l4num
)
113 return ctnl_timeout_parse_policy(&matching
->data
,
114 matching
->l4proto
, net
,
115 cda
[CTA_TIMEOUT_DATA
]);
121 l4proto
= nf_ct_l4proto_find_get(l3num
, l4num
);
123 /* This protocol is not supportted, skip. */
124 if (l4proto
->l4proto
!= l4num
) {
129 timeout
= kzalloc(sizeof(struct ctnl_timeout
) +
130 l4proto
->ctnl_timeout
.obj_size
, GFP_KERNEL
);
131 if (timeout
== NULL
) {
136 ret
= ctnl_timeout_parse_policy(&timeout
->data
, l4proto
, net
,
137 cda
[CTA_TIMEOUT_DATA
]);
141 strcpy(timeout
->name
, nla_data(cda
[CTA_TIMEOUT_NAME
]));
142 timeout
->l3num
= l3num
;
143 timeout
->l4proto
= l4proto
;
144 refcount_set(&timeout
->refcnt
, 1);
145 list_add_tail_rcu(&timeout
->head
, &net
->nfct_timeout_list
);
151 nf_ct_l4proto_put(l4proto
);
156 ctnl_timeout_fill_info(struct sk_buff
*skb
, u32 portid
, u32 seq
, u32 type
,
157 int event
, struct ctnl_timeout
*timeout
)
159 struct nlmsghdr
*nlh
;
160 struct nfgenmsg
*nfmsg
;
161 unsigned int flags
= portid
? NLM_F_MULTI
: 0;
162 const struct nf_conntrack_l4proto
*l4proto
= timeout
->l4proto
;
164 event
= nfnl_msg_type(NFNL_SUBSYS_CTNETLINK_TIMEOUT
, event
);
165 nlh
= nlmsg_put(skb
, portid
, seq
, event
, sizeof(*nfmsg
), flags
);
169 nfmsg
= nlmsg_data(nlh
);
170 nfmsg
->nfgen_family
= AF_UNSPEC
;
171 nfmsg
->version
= NFNETLINK_V0
;
174 if (nla_put_string(skb
, CTA_TIMEOUT_NAME
, timeout
->name
) ||
175 nla_put_be16(skb
, CTA_TIMEOUT_L3PROTO
, htons(timeout
->l3num
)) ||
176 nla_put_u8(skb
, CTA_TIMEOUT_L4PROTO
, timeout
->l4proto
->l4proto
) ||
177 nla_put_be32(skb
, CTA_TIMEOUT_USE
,
178 htonl(refcount_read(&timeout
->refcnt
))))
179 goto nla_put_failure
;
181 if (likely(l4proto
->ctnl_timeout
.obj_to_nlattr
)) {
182 struct nlattr
*nest_parms
;
185 nest_parms
= nla_nest_start(skb
,
186 CTA_TIMEOUT_DATA
| NLA_F_NESTED
);
188 goto nla_put_failure
;
190 ret
= l4proto
->ctnl_timeout
.obj_to_nlattr(skb
, &timeout
->data
);
192 goto nla_put_failure
;
194 nla_nest_end(skb
, nest_parms
);
202 nlmsg_cancel(skb
, nlh
);
207 ctnl_timeout_dump(struct sk_buff
*skb
, struct netlink_callback
*cb
)
209 struct net
*net
= sock_net(skb
->sk
);
210 struct ctnl_timeout
*cur
, *last
;
215 last
= (struct ctnl_timeout
*)cb
->args
[1];
220 list_for_each_entry_rcu(cur
, &net
->nfct_timeout_list
, head
) {
227 if (ctnl_timeout_fill_info(skb
, NETLINK_CB(cb
->skb
).portid
,
229 NFNL_MSG_TYPE(cb
->nlh
->nlmsg_type
),
230 IPCTNL_MSG_TIMEOUT_NEW
, cur
) < 0) {
231 cb
->args
[1] = (unsigned long)cur
;
241 static int cttimeout_get_timeout(struct net
*net
, struct sock
*ctnl
,
243 const struct nlmsghdr
*nlh
,
244 const struct nlattr
* const cda
[],
245 struct netlink_ext_ack
*extack
)
249 struct ctnl_timeout
*cur
;
251 if (nlh
->nlmsg_flags
& NLM_F_DUMP
) {
252 struct netlink_dump_control c
= {
253 .dump
= ctnl_timeout_dump
,
255 return netlink_dump_start(ctnl
, skb
, nlh
, &c
);
258 if (!cda
[CTA_TIMEOUT_NAME
])
260 name
= nla_data(cda
[CTA_TIMEOUT_NAME
]);
262 list_for_each_entry(cur
, &net
->nfct_timeout_list
, head
) {
263 struct sk_buff
*skb2
;
265 if (strncmp(cur
->name
, name
, CTNL_TIMEOUT_NAME_MAX
) != 0)
268 skb2
= nlmsg_new(NLMSG_DEFAULT_SIZE
, GFP_KERNEL
);
274 ret
= ctnl_timeout_fill_info(skb2
, NETLINK_CB(skb
).portid
,
276 NFNL_MSG_TYPE(nlh
->nlmsg_type
),
277 IPCTNL_MSG_TIMEOUT_NEW
, cur
);
282 ret
= netlink_unicast(ctnl
, skb2
, NETLINK_CB(skb
).portid
,
287 /* this avoids a loop in nfnetlink. */
288 return ret
== -EAGAIN
? -ENOBUFS
: ret
;
293 static int untimeout(struct nf_conn
*ct
, void *timeout
)
295 struct nf_conn_timeout
*timeout_ext
= nf_ct_timeout_find(ct
);
297 if (timeout_ext
&& (!timeout
|| timeout_ext
->timeout
== timeout
))
298 RCU_INIT_POINTER(timeout_ext
->timeout
, NULL
);
300 /* We are not intended to delete this conntrack. */
304 static void ctnl_untimeout(struct net
*net
, struct ctnl_timeout
*timeout
)
306 nf_ct_iterate_cleanup_net(net
, untimeout
, timeout
, 0, 0);
309 /* try to delete object, fail if it is still in use. */
310 static int ctnl_timeout_try_del(struct net
*net
, struct ctnl_timeout
*timeout
)
314 /* We want to avoid races with ctnl_timeout_put. So only when the
315 * current refcnt is 1, we decrease it to 0.
317 if (refcount_dec_if_one(&timeout
->refcnt
)) {
318 /* We are protected by nfnl mutex. */
319 list_del_rcu(&timeout
->head
);
320 nf_ct_l4proto_put(timeout
->l4proto
);
321 ctnl_untimeout(net
, timeout
);
322 kfree_rcu(timeout
, rcu_head
);
329 static int cttimeout_del_timeout(struct net
*net
, struct sock
*ctnl
,
331 const struct nlmsghdr
*nlh
,
332 const struct nlattr
* const cda
[],
333 struct netlink_ext_ack
*extack
)
335 struct ctnl_timeout
*cur
, *tmp
;
339 if (!cda
[CTA_TIMEOUT_NAME
]) {
340 list_for_each_entry_safe(cur
, tmp
, &net
->nfct_timeout_list
,
342 ctnl_timeout_try_del(net
, cur
);
346 name
= nla_data(cda
[CTA_TIMEOUT_NAME
]);
348 list_for_each_entry(cur
, &net
->nfct_timeout_list
, head
) {
349 if (strncmp(cur
->name
, name
, CTNL_TIMEOUT_NAME_MAX
) != 0)
352 ret
= ctnl_timeout_try_del(net
, cur
);
361 static int cttimeout_default_set(struct net
*net
, struct sock
*ctnl
,
363 const struct nlmsghdr
*nlh
,
364 const struct nlattr
* const cda
[],
365 struct netlink_ext_ack
*extack
)
367 const struct nf_conntrack_l4proto
*l4proto
;
368 unsigned int *timeouts
;
373 if (!cda
[CTA_TIMEOUT_L3PROTO
] ||
374 !cda
[CTA_TIMEOUT_L4PROTO
] ||
375 !cda
[CTA_TIMEOUT_DATA
])
378 l3num
= ntohs(nla_get_be16(cda
[CTA_TIMEOUT_L3PROTO
]));
379 l4num
= nla_get_u8(cda
[CTA_TIMEOUT_L4PROTO
]);
380 l4proto
= nf_ct_l4proto_find_get(l3num
, l4num
);
382 /* This protocol is not supported, skip. */
383 if (l4proto
->l4proto
!= l4num
) {
388 timeouts
= l4proto
->get_timeouts(net
);
390 ret
= ctnl_timeout_parse_policy(timeouts
, l4proto
, net
,
391 cda
[CTA_TIMEOUT_DATA
]);
395 nf_ct_l4proto_put(l4proto
);
398 nf_ct_l4proto_put(l4proto
);
403 cttimeout_default_fill_info(struct net
*net
, struct sk_buff
*skb
, u32 portid
,
404 u32 seq
, u32 type
, int event
,
405 const struct nf_conntrack_l4proto
*l4proto
)
407 struct nlmsghdr
*nlh
;
408 struct nfgenmsg
*nfmsg
;
409 unsigned int flags
= portid
? NLM_F_MULTI
: 0;
411 event
= nfnl_msg_type(NFNL_SUBSYS_CTNETLINK_TIMEOUT
, event
);
412 nlh
= nlmsg_put(skb
, portid
, seq
, event
, sizeof(*nfmsg
), flags
);
416 nfmsg
= nlmsg_data(nlh
);
417 nfmsg
->nfgen_family
= AF_UNSPEC
;
418 nfmsg
->version
= NFNETLINK_V0
;
421 if (nla_put_be16(skb
, CTA_TIMEOUT_L3PROTO
, htons(l4proto
->l3proto
)) ||
422 nla_put_u8(skb
, CTA_TIMEOUT_L4PROTO
, l4proto
->l4proto
))
423 goto nla_put_failure
;
425 if (likely(l4proto
->ctnl_timeout
.obj_to_nlattr
)) {
426 struct nlattr
*nest_parms
;
427 unsigned int *timeouts
= l4proto
->get_timeouts(net
);
430 nest_parms
= nla_nest_start(skb
,
431 CTA_TIMEOUT_DATA
| NLA_F_NESTED
);
433 goto nla_put_failure
;
435 ret
= l4proto
->ctnl_timeout
.obj_to_nlattr(skb
, timeouts
);
437 goto nla_put_failure
;
439 nla_nest_end(skb
, nest_parms
);
447 nlmsg_cancel(skb
, nlh
);
451 static int cttimeout_default_get(struct net
*net
, struct sock
*ctnl
,
453 const struct nlmsghdr
*nlh
,
454 const struct nlattr
* const cda
[],
455 struct netlink_ext_ack
*extack
)
457 const struct nf_conntrack_l4proto
*l4proto
;
458 struct sk_buff
*skb2
;
463 if (!cda
[CTA_TIMEOUT_L3PROTO
] || !cda
[CTA_TIMEOUT_L4PROTO
])
466 l3num
= ntohs(nla_get_be16(cda
[CTA_TIMEOUT_L3PROTO
]));
467 l4num
= nla_get_u8(cda
[CTA_TIMEOUT_L4PROTO
]);
468 l4proto
= nf_ct_l4proto_find_get(l3num
, l4num
);
470 /* This protocol is not supported, skip. */
471 if (l4proto
->l4proto
!= l4num
) {
476 skb2
= nlmsg_new(NLMSG_DEFAULT_SIZE
, GFP_KERNEL
);
482 ret
= cttimeout_default_fill_info(net
, skb2
, NETLINK_CB(skb
).portid
,
484 NFNL_MSG_TYPE(nlh
->nlmsg_type
),
485 IPCTNL_MSG_TIMEOUT_DEFAULT_SET
,
492 ret
= netlink_unicast(ctnl
, skb2
, NETLINK_CB(skb
).portid
, MSG_DONTWAIT
);
496 /* this avoids a loop in nfnetlink. */
497 return ret
== -EAGAIN
? -ENOBUFS
: ret
;
499 nf_ct_l4proto_put(l4proto
);
#ifdef CONFIG_NF_CONNTRACK_TIMEOUT
/*
 * Look up a timeout policy by name and take a reference on it.
 *
 * On success both a reference on this module and a reference on the policy
 * are held; release them with ctnl_timeout_put().  Returns NULL if no
 * policy matches or if either reference cannot be taken.
 */
static struct ctnl_timeout *
ctnl_timeout_find_get(struct net *net, const char *name)
{
	struct ctnl_timeout *cur, *found = NULL;

	list_for_each_entry_rcu(cur, &net->nfct_timeout_list, head) {
		if (strncmp(cur->name, name, CTNL_TIMEOUT_NAME_MAX) != 0)
			continue;

		if (!try_module_get(THIS_MODULE))
			break;

		/* A zero refcount means the policy is being deleted. */
		if (!refcount_inc_not_zero(&cur->refcnt)) {
			module_put(THIS_MODULE);
			break;
		}

		found = cur;
		break;
	}

	return found;
}

/*
 * Release the references taken by ctnl_timeout_find_get(); the policy is
 * freed after an RCU grace period once its last reference is gone.
 */
static void ctnl_timeout_put(struct ctnl_timeout *timeout)
{
	if (refcount_dec_and_test(&timeout->refcnt))
		kfree_rcu(timeout, rcu_head);

	module_put(THIS_MODULE);
}
#endif /* CONFIG_NF_CONNTRACK_TIMEOUT */
536 static const struct nfnl_callback cttimeout_cb
[IPCTNL_MSG_TIMEOUT_MAX
] = {
537 [IPCTNL_MSG_TIMEOUT_NEW
] = { .call
= cttimeout_new_timeout
,
538 .attr_count
= CTA_TIMEOUT_MAX
,
539 .policy
= cttimeout_nla_policy
},
540 [IPCTNL_MSG_TIMEOUT_GET
] = { .call
= cttimeout_get_timeout
,
541 .attr_count
= CTA_TIMEOUT_MAX
,
542 .policy
= cttimeout_nla_policy
},
543 [IPCTNL_MSG_TIMEOUT_DELETE
] = { .call
= cttimeout_del_timeout
,
544 .attr_count
= CTA_TIMEOUT_MAX
,
545 .policy
= cttimeout_nla_policy
},
546 [IPCTNL_MSG_TIMEOUT_DEFAULT_SET
]= { .call
= cttimeout_default_set
,
547 .attr_count
= CTA_TIMEOUT_MAX
,
548 .policy
= cttimeout_nla_policy
},
549 [IPCTNL_MSG_TIMEOUT_DEFAULT_GET
]= { .call
= cttimeout_default_get
,
550 .attr_count
= CTA_TIMEOUT_MAX
,
551 .policy
= cttimeout_nla_policy
},
554 static const struct nfnetlink_subsystem cttimeout_subsys
= {
555 .name
= "conntrack_timeout",
556 .subsys_id
= NFNL_SUBSYS_CTNETLINK_TIMEOUT
,
557 .cb_count
= IPCTNL_MSG_TIMEOUT_MAX
,
/* Module alias for the cttimeout nfnetlink subsystem id. */
MODULE_ALIAS_NFNL_SUBSYS(NFNL_SUBSYS_CTNETLINK_TIMEOUT);
563 static int __net_init
cttimeout_net_init(struct net
*net
)
565 INIT_LIST_HEAD(&net
->nfct_timeout_list
);
570 static void __net_exit
cttimeout_net_exit(struct net
*net
)
572 struct ctnl_timeout
*cur
, *tmp
;
574 nf_ct_unconfirmed_destroy(net
);
575 ctnl_untimeout(net
, NULL
);
577 list_for_each_entry_safe(cur
, tmp
, &net
->nfct_timeout_list
, head
) {
578 list_del_rcu(&cur
->head
);
579 nf_ct_l4proto_put(cur
->l4proto
);
581 if (refcount_dec_and_test(&cur
->refcnt
))
582 kfree_rcu(cur
, rcu_head
);
586 static struct pernet_operations cttimeout_ops
= {
587 .init
= cttimeout_net_init
,
588 .exit
= cttimeout_net_exit
,
591 static int __init
cttimeout_init(void)
595 ret
= register_pernet_subsys(&cttimeout_ops
);
599 ret
= nfnetlink_subsys_register(&cttimeout_subsys
);
601 pr_err("cttimeout_init: cannot register cttimeout with "
605 #ifdef CONFIG_NF_CONNTRACK_TIMEOUT
606 RCU_INIT_POINTER(nf_ct_timeout_find_get_hook
, ctnl_timeout_find_get
);
607 RCU_INIT_POINTER(nf_ct_timeout_put_hook
, ctnl_timeout_put
);
608 #endif /* CONFIG_NF_CONNTRACK_TIMEOUT */
612 unregister_pernet_subsys(&cttimeout_ops
);
616 static void __exit
cttimeout_exit(void)
618 pr_info("cttimeout: unregistering from nfnetlink.\n");
620 nfnetlink_subsys_unregister(&cttimeout_subsys
);
622 unregister_pernet_subsys(&cttimeout_ops
);
623 #ifdef CONFIG_NF_CONNTRACK_TIMEOUT
624 RCU_INIT_POINTER(nf_ct_timeout_find_get_hook
, NULL
);
625 RCU_INIT_POINTER(nf_ct_timeout_put_hook
, NULL
);
627 #endif /* CONFIG_NF_CONNTRACK_TIMEOUT */
/* Module load/unload entry points. */
module_init(cttimeout_init);
module_exit(cttimeout_exit);