2 * (C) 2011 Pablo Neira Ayuso <pablo@netfilter.org>
3 * (C) 2011 Intra2net AG <http://www.intra2net.com>
5 * This program is free software; you can redistribute it and/or modify
6 * it under the terms of the GNU General Public License version 2 as
7 * published by the Free Software Foundation (or any later at your option).
9 #include <linux/init.h>
10 #include <linux/module.h>
11 #include <linux/kernel.h>
12 #include <linux/skbuff.h>
13 #include <linux/atomic.h>
14 #include <linux/netlink.h>
15 #include <linux/rculist.h>
16 #include <linux/slab.h>
17 #include <linux/types.h>
18 #include <linux/errno.h>
19 #include <net/netlink.h>
22 #include <linux/netfilter.h>
23 #include <linux/netfilter/nfnetlink.h>
24 #include <linux/netfilter/nfnetlink_acct.h>
26 MODULE_LICENSE("GPL");
27 MODULE_AUTHOR("Pablo Neira Ayuso <pablo@netfilter.org>");
28 MODULE_DESCRIPTION("nfacct: Extended Netfilter accounting infrastructure");
/*
 * Global list of accounting objects. Entries are linked through their
 * `head` member and walked with the list_for_each_entry*() helpers used
 * throughout this file.
 */
30 static LIST_HEAD(nfnl_acct_list
);
/*
 * Members of the accounting object.
 * NOTE(review): the enclosing struct header and several members are not
 * visible in this listing (the embedded line numbers skip) - confirm the
 * full layout against the complete file.
 */
/* Linkage into nfnl_acct_list. */
36 struct list_head head
;
/* Object name; compared with strncmp() bounded by NFACCT_NAME_MAX. */
38 char name
[NFACCT_NAME_MAX
];
/* Handle handed to kfree_rcu() when an object is released. */
39 struct rcu_head rcu_head
;
/*
 * Dump filter; nfnl_acct_dump() reads its `mask` and `value` fields.
 * NOTE(review): the struct body is not visible in this listing.
 */
43 struct nfacct_filter
{
/* Either quota mode: packet-based or byte-based. */
48 #define NFACCT_F_QUOTA (NFACCT_F_QUOTA_PKTS | NFACCT_F_QUOTA_BYTES)
/* Bit index passed to clear_bit()/test_and_set_bit() on the flags word. */
49 #define NFACCT_OVERQUOTA_BIT 2 /* NFACCT_F_OVERQUOTA */
/*
 * nfnl_acct_new - handler wired to NFNL_MSG_ACCT_NEW in nfnl_acct_cb.
 *
 * Searches nfnl_acct_list for an object whose name equals NFACCT_NAME.
 * When NLM_F_REPLACE is requested for a match, the packet and byte counters
 * are zeroed and, if a quota flag is set, the overquota bit is cleared.
 * Otherwise a zeroed object is allocated (plus `size` trailing bytes), its
 * name, optional quota, and optional initial counters are filled in from the
 * attributes, its refcnt is set to 1 and it is appended to the list.
 *
 * NOTE(review): this listing omits some source lines (the embedded line
 * numbers skip), so the return statements and a few declarations are not
 * visible here.
 */
52 nfnl_acct_new(struct sock
*nfnl
, struct sk_buff
*skb
,
53 const struct nlmsghdr
*nlh
, const struct nlattr
* const tb
[])
55 struct nf_acct
*nfacct
, *matching
= NULL
;
/* Extra bytes requested from kzalloc() beyond sizeof(struct nf_acct). */
57 unsigned int size
= 0;
63 acct_name
= nla_data(tb
[NFACCT_NAME
]);
/* An empty name is tested for; the outcome is not visible in this listing. */
64 if (strlen(acct_name
) == 0)
/* Plain (non-RCU) list walk looking for an object with the same name. */
67 list_for_each_entry(nfacct
, &nfnl_acct_list
, head
) {
68 if (strncmp(nfacct
->name
, acct_name
, NFACCT_NAME_MAX
) != 0)
71 if (nlh
->nlmsg_flags
& NLM_F_EXCL
)
79 if (nlh
->nlmsg_flags
& NLM_F_REPLACE
) {
80 /* reset counters if you request a replacement. */
81 atomic64_set(&matching
->pkts
, 0);
82 atomic64_set(&matching
->bytes
, 0);
83 smp_mb__before_atomic();
84 /* reset overquota flag if quota is enabled. */
85 if ((matching
->flags
& NFACCT_F_QUOTA
))
86 clear_bit(NFACCT_OVERQUOTA_BIT
,
/*
 * Flag validation: bits outside NFACCT_F_QUOTA, both quota bits at once, and
 * NFACCT_F_OVERQUOTA are each tested. The action taken for each test is not
 * visible in this listing.
 */
93 if (tb
[NFACCT_FLAGS
]) {
94 flags
= ntohl(nla_get_be32(tb
[NFACCT_FLAGS
]));
95 if (flags
& ~NFACCT_F_QUOTA
)
97 if ((flags
& NFACCT_F_QUOTA
) == NFACCT_F_QUOTA
)
99 if (flags
& NFACCT_F_OVERQUOTA
)
/* Zeroed allocation, so counters, flags and name start out as all-zero. */
105 nfacct
= kzalloc(sizeof(struct nf_acct
) + size
, GFP_KERNEL
);
/*
 * The quota value is stored in the trailing `data` area of the object.
 * NOTE(review): tb[NFACCT_QUOTA] is read here, but no check that the
 * attribute is present is visible in this listing - confirm one exists,
 * otherwise a request with quota flags and no NFACCT_QUOTA dereferences NULL.
 */
109 if (flags
& NFACCT_F_QUOTA
) {
110 u64
*quota
= (u64
*)nfacct
->data
;
112 *quota
= be64_to_cpu(nla_get_be64(tb
[NFACCT_QUOTA
]));
113 nfacct
->flags
= flags
;
/*
 * NOTE(review): strncpy() does not NUL-terminate when the source fills the
 * buffer. This appears to rely on nfnl_acct_policy limiting NFACCT_NAME to
 * NFACCT_NAME_MAX-1 bytes and on the zeroing kzalloc() above - confirm.
 */
116 strncpy(nfacct
->name
, nla_data(tb
[NFACCT_NAME
]), NFACCT_NAME_MAX
);
/* Optional initial counter values supplied by the caller (big-endian). */
118 if (tb
[NFACCT_BYTES
]) {
119 atomic64_set(&nfacct
->bytes
,
120 be64_to_cpu(nla_get_be64(tb
[NFACCT_BYTES
])));
122 if (tb
[NFACCT_PKTS
]) {
123 atomic64_set(&nfacct
->pkts
,
124 be64_to_cpu(nla_get_be64(tb
[NFACCT_PKTS
])));
/* The list itself holds the initial reference. */
126 atomic_set(&nfacct
->refcnt
, 1);
127 list_add_tail_rcu(&nfacct
->head
, &nfnl_acct_list
);
/*
 * nfnl_acct_fill_info - serialise one accounting object into a netlink
 * message appended to @skb.
 *
 * Emits a header via nlmsg_put() (event is combined with
 * NFNL_SUBSYS_ACCT << 8), an nfgenmsg with AF_UNSPEC / NFNETLINK_V0, and the
 * attributes NFACCT_NAME, NFACCT_PKTS, NFACCT_BYTES and NFACCT_USE (the
 * current refcnt). When a quota flag is set, NFACCT_FLAGS and NFACCT_QUOTA
 * are added as well.
 *
 * For @type == NFNL_MSG_ACCT_GET_CTRZERO the counters are fetched with
 * atomic64_xchg(..., 0), i.e. read and reset in one step, and the overquota
 * bit is cleared.
 *
 * Attribute failures jump to nla_put_failure, where the partially built
 * message is cancelled.
 * NOTE(review): the return statements and the declarations of `pkts`,
 * `bytes` and `old_flags` are not visible in this listing.
 */
132 nfnl_acct_fill_info(struct sk_buff
*skb
, u32 portid
, u32 seq
, u32 type
,
133 int event
, struct nf_acct
*acct
)
135 struct nlmsghdr
*nlh
;
136 struct nfgenmsg
*nfmsg
;
/* NLM_F_MULTI is set whenever a non-zero portid is supplied. */
137 unsigned int flags
= portid
? NLM_F_MULTI
: 0;
141 event
|= NFNL_SUBSYS_ACCT
<< 8;
142 nlh
= nlmsg_put(skb
, portid
, seq
, event
, sizeof(*nfmsg
), flags
);
146 nfmsg
= nlmsg_data(nlh
);
147 nfmsg
->nfgen_family
= AF_UNSPEC
;
148 nfmsg
->version
= NFNETLINK_V0
;
151 if (nla_put_string(skb
, NFACCT_NAME
, acct
->name
))
152 goto nla_put_failure
;
/*
 * Snapshot the flags before a possible clear_bit() below, so that the
 * NFACCT_FLAGS attribute reports the state from before the reset.
 */
154 old_flags
= acct
->flags
;
155 if (type
== NFNL_MSG_ACCT_GET_CTRZERO
) {
156 pkts
= atomic64_xchg(&acct
->pkts
, 0);
157 bytes
= atomic64_xchg(&acct
->bytes
, 0);
158 smp_mb__before_atomic();
159 if (acct
->flags
& NFACCT_F_QUOTA
)
160 clear_bit(NFACCT_OVERQUOTA_BIT
, &acct
->flags
);
/* Plain read of the counters (no reset). */
162 pkts
= atomic64_read(&acct
->pkts
);
163 bytes
= atomic64_read(&acct
->bytes
);
165 if (nla_put_be64(skb
, NFACCT_PKTS
, cpu_to_be64(pkts
)) ||
166 nla_put_be64(skb
, NFACCT_BYTES
, cpu_to_be64(bytes
)) ||
167 nla_put_be32(skb
, NFACCT_USE
, htonl(atomic_read(&acct
->refcnt
))))
168 goto nla_put_failure
;
/* Quota objects additionally report their flags and the configured quota. */
169 if (acct
->flags
& NFACCT_F_QUOTA
) {
170 u64
*quota
= (u64
*)acct
->data
;
172 if (nla_put_be32(skb
, NFACCT_FLAGS
, htonl(old_flags
)) ||
173 nla_put_be64(skb
, NFACCT_QUOTA
, cpu_to_be64(*quota
)))
174 goto nla_put_failure
;
/* Failure path: drop the partially built message from the skb. */
181 nlmsg_cancel(skb
, nlh
);
/*
 * nfnl_acct_dump - netlink dump callback (wired as .dump in nfnl_acct_get).
 *
 * Walks nfnl_acct_list with the RCU list iterator and serialises each object
 * with nfnl_acct_fill_info(). When a filter is attached to cb->data, objects
 * whose (flags & mask) differ from the filter value are tested for and, it
 * appears, skipped. If filling fails, the current object pointer is stored
 * in cb->args[1].
 *
 * NOTE(review): `last` is loaded from cb->args[1]; presumably it is the
 * resume point for a dump spanning several skbs, but the lines that use it
 * are not visible in this listing - confirm.
 */
186 nfnl_acct_dump(struct sk_buff
*skb
, struct netlink_callback
*cb
)
188 struct nf_acct
*cur
, *last
;
189 const struct nfacct_filter
*filter
= cb
->data
;
194 last
= (struct nf_acct
*)cb
->args
[1];
199 list_for_each_entry_rcu(cur
, &nfnl_acct_list
, head
) {
/* A NULL filter means no filtering is applied. */
207 if (filter
&& (cur
->flags
& filter
->mask
) != filter
->value
)
210 if (nfnl_acct_fill_info(skb
, NETLINK_CB(cb
->skb
).portid
,
212 NFNL_MSG_TYPE(cb
->nlh
->nlmsg_type
),
213 NFNL_MSG_ACCT_NEW
, cur
) < 0) {
/* Remember the object that did not fit. */
214 cb
->args
[1] = (unsigned long)cur
;
/*
 * nfnl_acct_done - dump completion callback (wired as .done in
 * nfnl_acct_get).
 * NOTE(review): the body is not visible in this listing.
 */
224 static int nfnl_acct_done(struct netlink_callback
*cb
)
/*
 * Attribute policy for the nested NFACCT_FILTER attribute: both the mask and
 * the value are declared as 32-bit attributes. Used by nfacct_filter_alloc().
 */
230 static const struct nla_policy filter_policy
[NFACCT_FILTER_MAX
+ 1] = {
231 [NFACCT_FILTER_MASK
] = { .type
= NLA_U32
},
232 [NFACCT_FILTER_VALUE
] = { .type
= NLA_U32
},
/*
 * nfacct_filter_alloc - build a dump filter from a nested NFACCT_FILTER
 * attribute.
 *
 * Parses @attr against filter_policy, allocates a zeroed struct
 * nfacct_filter and fills `mask` and `value` from the big-endian
 * NFACCT_FILTER_MASK / NFACCT_FILTER_VALUE attributes. ERR_PTR(-ENOMEM) is
 * one of the visible return values.
 *
 * NOTE(review): tb[NFACCT_FILTER_MASK] and tb[NFACCT_FILTER_VALUE] are passed
 * straight to nla_get_be32(); no check that either attribute is present is
 * visible in this listing. A policy entry does not make an attribute
 * mandatory, so confirm that a NULL check exists before these reads.
 */
235 static struct nfacct_filter
*
236 nfacct_filter_alloc(const struct nlattr
* const attr
)
238 struct nfacct_filter
*filter
;
239 struct nlattr
*tb
[NFACCT_FILTER_MAX
+ 1];
242 err
= nla_parse_nested(tb
, NFACCT_FILTER_MAX
, attr
, filter_policy
);
246 filter
= kzalloc(sizeof(struct nfacct_filter
), GFP_KERNEL
);
248 return ERR_PTR(-ENOMEM
);
/* Attributes arrive in network byte order. */
250 filter
->mask
= ntohl(nla_get_be32(tb
[NFACCT_FILTER_MASK
]));
251 filter
->value
= ntohl(nla_get_be32(tb
[NFACCT_FILTER_VALUE
]));
/*
 * nfnl_acct_get - handler wired to both NFNL_MSG_ACCT_GET and
 * NFNL_MSG_ACCT_GET_CTRZERO in nfnl_acct_cb.
 *
 * With NLM_F_DUMP: prepares a netlink_dump_control using nfnl_acct_dump /
 * nfnl_acct_done, optionally builds a filter from NFACCT_FILTER, and starts
 * the dump with netlink_dump_start().
 *
 * Otherwise: looks up the object named by NFACCT_NAME, allocates a reply skb,
 * fills it with nfnl_acct_fill_info() (passing the request's message type)
 * and unicasts it to the requester's portid.
 *
 * NOTE(review): several lines (declarations, error returns, loop exits) are
 * not visible in this listing.
 */
257 nfnl_acct_get(struct sock
*nfnl
, struct sk_buff
*skb
,
258 const struct nlmsghdr
*nlh
, const struct nlattr
* const tb
[])
264 if (nlh
->nlmsg_flags
& NLM_F_DUMP
) {
265 struct netlink_dump_control c
= {
266 .dump
= nfnl_acct_dump
,
267 .done
= nfnl_acct_done
,
270 if (tb
[NFACCT_FILTER
]) {
271 struct nfacct_filter
*filter
;
273 filter
= nfacct_filter_alloc(tb
[NFACCT_FILTER
]);
/* nfacct_filter_alloc() reports failure as an ERR_PTR value. */
275 return PTR_ERR(filter
);
279 return netlink_dump_start(nfnl
, skb
, nlh
, &c
);
/* Single-object request: a name is required. */
282 if (!tb
[NFACCT_NAME
])
284 acct_name
= nla_data(tb
[NFACCT_NAME
]);
286 list_for_each_entry(cur
, &nfnl_acct_list
, head
) {
287 struct sk_buff
*skb2
;
289 if (strncmp(cur
->name
, acct_name
, NFACCT_NAME_MAX
)!= 0)
/* Reply is built in a fresh skb of default netlink message size. */
292 skb2
= nlmsg_new(NLMSG_DEFAULT_SIZE
, GFP_KERNEL
);
298 ret
= nfnl_acct_fill_info(skb2
, NETLINK_CB(skb
).portid
,
300 NFNL_MSG_TYPE(nlh
->nlmsg_type
),
301 NFNL_MSG_ACCT_NEW
, cur
);
306 ret
= netlink_unicast(nfnl
, skb2
, NETLINK_CB(skb
).portid
,
311 /* this avoids a loop in nfnetlink. */
312 return ret
== -EAGAIN
? -ENOBUFS
: ret
;
/*
 * nfnl_acct_try_del - drop the list's reference on @cur and free the object
 * if that was the last one.
 *
 * When the decrement reaches zero the object is unlinked with list_del_rcu()
 * and released through kfree_rcu(). Otherwise the reference is put back with
 * atomic_inc().
 *
 * NOTE(review): between the decrement and the restoring increment the count
 * is transiently one lower than the real number of holders.
 * nfnl_acct_find_get() uses atomic_inc_not_zero() and nfnl_acct_put() uses a
 * bare atomic_dec(), so a concurrent put could make the count hit zero inside
 * that window. A single compare-and-exchange from 1 to 0 would avoid the
 * window - confirm whether this matters for the callers.
 * NOTE(review): the return statements are not visible in this listing.
 */
317 /* try to delete object, fail if it is still in use. */
318 static int nfnl_acct_try_del(struct nf_acct
*cur
)
322 /* we want to avoid races with nfnl_acct_find_get. */
323 if (atomic_dec_and_test(&cur
->refcnt
)) {
324 /* We are protected by nfnl mutex. */
325 list_del_rcu(&cur
->head
);
326 kfree_rcu(cur
, rcu_head
);
328 /* still in use, restore reference counter. */
329 atomic_inc(&cur
->refcnt
);
/*
 * nfnl_acct_del - handler wired to NFNL_MSG_ACCT_DEL in nfnl_acct_cb.
 *
 * Without NFACCT_NAME every object on nfnl_acct_list is passed to
 * nfnl_acct_try_del() (a flush; the per-object result is ignored). With
 * NFACCT_NAME only the object with a matching name is passed to
 * nfnl_acct_try_del() and its result is kept in `ret`.
 *
 * NOTE(review): the flush loop uses list_for_each_entry(), yet
 * nfnl_acct_try_del() may unlink the current entry and queue it for
 * kfree_rcu(). The iterator then reads the next pointer from an entry that is
 * already scheduled for freeing; list_for_each_entry_safe() (as used in
 * nfnl_acct_exit()) is the usual form for delete-while-iterating - confirm.
 * NOTE(review): declarations and return statements are not visible in this
 * listing.
 */
336 nfnl_acct_del(struct sock
*nfnl
, struct sk_buff
*skb
,
337 const struct nlmsghdr
*nlh
, const struct nlattr
* const tb
[])
/* No name given: try to delete everything. */
343 if (!tb
[NFACCT_NAME
]) {
344 list_for_each_entry(cur
, &nfnl_acct_list
, head
)
345 nfnl_acct_try_del(cur
);
349 acct_name
= nla_data(tb
[NFACCT_NAME
]);
351 list_for_each_entry(cur
, &nfnl_acct_list
, head
) {
352 if (strncmp(cur
->name
, acct_name
, NFACCT_NAME_MAX
) != 0)
355 ret
= nfnl_acct_try_del(cur
);
/*
 * Attribute policy shared by all message types in nfnl_acct_cb.
 * NFACCT_NAME is a NUL-terminated string of at most NFACCT_NAME_MAX-1 bytes,
 * which leaves room for the terminator in the NFACCT_NAME_MAX-sized name
 * buffer of the object.
 */
364 static const struct nla_policy nfnl_acct_policy
[NFACCT_MAX
+1] = {
365 [NFACCT_NAME
] = { .type
= NLA_NUL_STRING
, .len
= NFACCT_NAME_MAX
-1 },
366 [NFACCT_BYTES
] = { .type
= NLA_U64
},
367 [NFACCT_PKTS
] = { .type
= NLA_U64
},
368 [NFACCT_FLAGS
] = { .type
= NLA_U32
},
369 [NFACCT_QUOTA
] = { .type
= NLA_U64
},
370 [NFACCT_FILTER
] = {.type
= NLA_NESTED
},
/*
 * Message-type dispatch table for the accounting subsystem. GET and
 * GET_CTRZERO share nfnl_acct_get(); every entry uses nfnl_acct_policy with
 * NFACCT_MAX attributes.
 */
373 static const struct nfnl_callback nfnl_acct_cb
[NFNL_MSG_ACCT_MAX
] = {
374 [NFNL_MSG_ACCT_NEW
] = { .call
= nfnl_acct_new
,
375 .attr_count
= NFACCT_MAX
,
376 .policy
= nfnl_acct_policy
},
377 [NFNL_MSG_ACCT_GET
] = { .call
= nfnl_acct_get
,
378 .attr_count
= NFACCT_MAX
,
379 .policy
= nfnl_acct_policy
},
380 [NFNL_MSG_ACCT_GET_CTRZERO
] = { .call
= nfnl_acct_get
,
381 .attr_count
= NFACCT_MAX
,
382 .policy
= nfnl_acct_policy
},
383 [NFNL_MSG_ACCT_DEL
] = { .call
= nfnl_acct_del
,
384 .attr_count
= NFACCT_MAX
,
385 .policy
= nfnl_acct_policy
},
/*
 * Subsystem descriptor passed to nfnetlink_subsys_register() /
 * nfnetlink_subsys_unregister() by the module init and exit functions.
 * NOTE(review): some initialisers are not visible in this listing.
 */
388 static const struct nfnetlink_subsystem nfnl_acct_subsys
= {
390 .subsys_id
= NFNL_SUBSYS_ACCT
,
391 .cb_count
= NFNL_MSG_ACCT_MAX
,
/* Module alias keyed on the accounting subsystem id. */
395 MODULE_ALIAS_NFNL_SUBSYS(NFNL_SUBSYS_ACCT
);
/*
 * nfnl_acct_find_get - look up an accounting object by name and take a
 * reference on it (exported, GPL-only).
 *
 * Walks nfnl_acct_list with the RCU iterator. For a matching name it first
 * pins this module with try_module_get() and then takes an object reference
 * with atomic_inc_not_zero(); if the object reference cannot be taken, the
 * module reference is dropped again. `acct` starts as NULL.
 *
 * NOTE(review): the RCU lock/unlock calls, the assignment to `acct` and the
 * return statement are not visible in this listing.
 */
397 struct nf_acct
*nfnl_acct_find_get(const char *acct_name
)
399 struct nf_acct
*cur
, *acct
= NULL
;
402 list_for_each_entry_rcu(cur
, &nfnl_acct_list
, head
) {
403 if (strncmp(cur
->name
, acct_name
, NFACCT_NAME_MAX
)!= 0)
406 if (!try_module_get(THIS_MODULE
))
/* Fails when the count already dropped to zero (object being deleted). */
409 if (!atomic_inc_not_zero(&cur
->refcnt
)) {
410 module_put(THIS_MODULE
);
421 EXPORT_SYMBOL_GPL(nfnl_acct_find_get
);
/*
 * nfnl_acct_put - release a reference obtained with nfnl_acct_find_get()
 * (exported, GPL-only).
 *
 * Undoes both steps of the get: drops the object reference and the module
 * reference. The object is not freed here; the decrement result is not
 * examined.
 */
423 void nfnl_acct_put(struct nf_acct
*acct
)
425 atomic_dec(&acct
->refcnt
);
426 module_put(THIS_MODULE
);
428 EXPORT_SYMBOL_GPL(nfnl_acct_put
);
/*
 * nfnl_acct_update - account one packet against @nfacct (exported,
 * GPL-only).
 *
 * Increments the packet counter by one and adds skb->len to the byte
 * counter. The two atomic updates are independent of each other.
 */
430 void nfnl_acct_update(const struct sk_buff
*skb
, struct nf_acct
*nfacct
)
432 atomic64_inc(&nfacct
->pkts
);
433 atomic64_add(skb
->len
, &nfacct
->bytes
);
435 EXPORT_SYMBOL_GPL(nfnl_acct_update
);
/*
 * nfnl_overquota_report - broadcast an overquota notification for @nfacct.
 *
 * Allocates an skb with GFP_ATOMIC, fills it through nfnl_acct_fill_info()
 * using message type NFNL_MSG_ACCT_OVERQUOTA (portid and seq are 0), and
 * broadcasts it on init_net's nfnetlink socket to group NFNLGRP_ACCT_QUOTA.
 *
 * NOTE(review): declarations, error checks and the trailing arguments of the
 * two split calls are not visible in this listing.
 */
437 static void nfnl_overquota_report(struct nf_acct
*nfacct
)
442 skb
= nlmsg_new(NLMSG_DEFAULT_SIZE
, GFP_ATOMIC
);
446 ret
= nfnl_acct_fill_info(skb
, 0, 0, NFNL_MSG_ACCT_OVERQUOTA
, 0,
452 netlink_broadcast(init_net
.nfnl
, skb
, 0, NFNLGRP_ACCT_QUOTA
,
/*
 * nfnl_acct_overquota - evaluate the quota state of @nfacct (exported,
 * GPL-only).
 *
 * Returns NFACCT_NO_QUOTA when neither quota flag is set. Otherwise the
 * quota is read from the object's trailing `data` area and `now` is taken
 * from the packet counter (NFACCT_F_QUOTA_PKTS) or the byte counter. `ret`
 * starts as NFACCT_UNDERQUOTA.
 *
 * The overquota report is guarded by !test_and_set_bit(), so it is only sent
 * by the caller that flips NFACCT_OVERQUOTA_BIT from clear to set.
 *
 * NOTE(review): the comparison of `now` against the quota and the final
 * return are not visible in this listing.
 */
456 int nfnl_acct_overquota(const struct sk_buff
*skb
, struct nf_acct
*nfacct
)
460 int ret
= NFACCT_UNDERQUOTA
;
462 /* no place here if we don't have a quota */
463 if (!(nfacct
->flags
& NFACCT_F_QUOTA
))
464 return NFACCT_NO_QUOTA
;
466 quota
= (u64
*)nfacct
->data
;
467 now
= (nfacct
->flags
& NFACCT_F_QUOTA_PKTS
) ?
468 atomic64_read(&nfacct
->pkts
) : atomic64_read(&nfacct
->bytes
);
473 !test_and_set_bit(NFACCT_OVERQUOTA_BIT
, &nfacct
->flags
)) {
474 nfnl_overquota_report(nfacct
);
479 EXPORT_SYMBOL_GPL(nfnl_acct_overquota
);
/*
 * nfnl_acct_init - module entry point: logs a message and registers
 * nfnl_acct_subsys with nfnetlink.
 * NOTE(review): the error message below is presumably printed only when
 * registration fails; the condition and the return statements are not
 * visible in this listing.
 */
481 static int __init
nfnl_acct_init(void)
485 pr_info("nfnl_acct: registering with nfnetlink.\n");
486 ret
= nfnetlink_subsys_register(&nfnl_acct_subsys
);
488 pr_err("nfnl_acct_init: cannot register with nfnetlink.\n");
/*
 * nfnl_acct_exit - module exit point: unregisters the subsystem first, then
 * unlinks every remaining object and releases it through kfree_rcu().
 * The _safe list iterator is used because entries are removed while walking.
 */
496 static void __exit
nfnl_acct_exit(void)
498 struct nf_acct
*cur
, *tmp
;
500 pr_info("nfnl_acct: unregistering from nfnetlink.\n");
501 nfnetlink_subsys_unregister(&nfnl_acct_subsys
);
503 list_for_each_entry_safe(cur
, tmp
, &nfnl_acct_list
, head
) {
504 list_del_rcu(&cur
->head
);
505 /* We are sure that our objects have no clients at this point,
506 * it's safe to release them all without checking refcnt. */
507 kfree_rcu(cur
, rcu_head
);
/* Register the entry and exit points with the module loader. */
511 module_init(nfnl_acct_init
);
512 module_exit(nfnl_acct_exit
);