2 * x_tables core - Backend for {ip,ip6,arp}_tables
4 * Copyright (C) 2006-2006 Harald Welte <laforge@netfilter.org>
5 * Copyright (C) 2006-2012 Patrick McHardy <kaber@trash.net>
7 * Based on existing ip_tables code which is
8 * Copyright (C) 1999 Paul `Rusty' Russell & Michael J. Neuling
9 * Copyright (C) 2000-2005 Netfilter Core Team <coreteam@netfilter.org>
11 * This program is free software; you can redistribute it and/or modify
12 * it under the terms of the GNU General Public License version 2 as
13 * published by the Free Software Foundation.
16 #define pr_fmt(fmt) KBUILD_MODNAME ": " fmt
17 #include <linux/kernel.h>
18 #include <linux/module.h>
19 #include <linux/socket.h>
20 #include <linux/net.h>
21 #include <linux/proc_fs.h>
22 #include <linux/seq_file.h>
23 #include <linux/string.h>
24 #include <linux/vmalloc.h>
25 #include <linux/mutex.h>
27 #include <linux/slab.h>
28 #include <linux/audit.h>
29 #include <linux/user_namespace.h>
30 #include <net/net_namespace.h>
32 #include <linux/netfilter/x_tables.h>
33 #include <linux/netfilter_arp.h>
34 #include <linux/netfilter_ipv4/ip_tables.h>
35 #include <linux/netfilter_ipv6/ip6_tables.h>
36 #include <linux/netfilter_arp/arp_tables.h>
38 MODULE_LICENSE("GPL");
39 MODULE_AUTHOR("Harald Welte <laforge@netfilter.org>");
40 MODULE_DESCRIPTION("{ip,ip6,arp,eb}_tables backend module");
42 #define XT_PCPU_BLOCK_SIZE 4096
45 unsigned int offset
; /* offset in kernel */
46 int delta
; /* delta in 32bit user land */
51 struct list_head match
;
52 struct list_head target
;
54 struct mutex compat_mutex
;
55 struct compat_delta
*compat_tab
;
56 unsigned int number
; /* number of slots in compat_tab[] */
57 unsigned int cur
; /* number of used slots in compat_tab[] */
61 static struct xt_af
*xt
;
63 static const char *const xt_prefix
[NFPROTO_NUMPROTO
] = {
64 [NFPROTO_UNSPEC
] = "x",
65 [NFPROTO_IPV4
] = "ip",
66 [NFPROTO_ARP
] = "arp",
67 [NFPROTO_BRIDGE
] = "eb",
68 [NFPROTO_IPV6
] = "ip6",
71 /* Registration hooks for targets. */
72 int xt_register_target(struct xt_target
*target
)
74 u_int8_t af
= target
->family
;
76 mutex_lock(&xt
[af
].mutex
);
77 list_add(&target
->list
, &xt
[af
].target
);
78 mutex_unlock(&xt
[af
].mutex
);
81 EXPORT_SYMBOL(xt_register_target
);
84 xt_unregister_target(struct xt_target
*target
)
86 u_int8_t af
= target
->family
;
88 mutex_lock(&xt
[af
].mutex
);
89 list_del(&target
->list
);
90 mutex_unlock(&xt
[af
].mutex
);
92 EXPORT_SYMBOL(xt_unregister_target
);
95 xt_register_targets(struct xt_target
*target
, unsigned int n
)
100 for (i
= 0; i
< n
; i
++) {
101 err
= xt_register_target(&target
[i
]);
109 xt_unregister_targets(target
, i
);
112 EXPORT_SYMBOL(xt_register_targets
);
115 xt_unregister_targets(struct xt_target
*target
, unsigned int n
)
118 xt_unregister_target(&target
[n
]);
120 EXPORT_SYMBOL(xt_unregister_targets
);
122 int xt_register_match(struct xt_match
*match
)
124 u_int8_t af
= match
->family
;
126 mutex_lock(&xt
[af
].mutex
);
127 list_add(&match
->list
, &xt
[af
].match
);
128 mutex_unlock(&xt
[af
].mutex
);
131 EXPORT_SYMBOL(xt_register_match
);
134 xt_unregister_match(struct xt_match
*match
)
136 u_int8_t af
= match
->family
;
138 mutex_lock(&xt
[af
].mutex
);
139 list_del(&match
->list
);
140 mutex_unlock(&xt
[af
].mutex
);
142 EXPORT_SYMBOL(xt_unregister_match
);
145 xt_register_matches(struct xt_match
*match
, unsigned int n
)
150 for (i
= 0; i
< n
; i
++) {
151 err
= xt_register_match(&match
[i
]);
159 xt_unregister_matches(match
, i
);
162 EXPORT_SYMBOL(xt_register_matches
);
165 xt_unregister_matches(struct xt_match
*match
, unsigned int n
)
168 xt_unregister_match(&match
[n
]);
170 EXPORT_SYMBOL(xt_unregister_matches
);
174 * These are weird, but module loading must not be done with mutex
175 * held (since they will register), and we have to have a single
179 /* Find match, grabs ref. Returns ERR_PTR() on error. */
180 struct xt_match
*xt_find_match(u8 af
, const char *name
, u8 revision
)
185 mutex_lock(&xt
[af
].mutex
);
186 list_for_each_entry(m
, &xt
[af
].match
, list
) {
187 if (strcmp(m
->name
, name
) == 0) {
188 if (m
->revision
== revision
) {
189 if (try_module_get(m
->me
)) {
190 mutex_unlock(&xt
[af
].mutex
);
194 err
= -EPROTOTYPE
; /* Found something. */
197 mutex_unlock(&xt
[af
].mutex
);
199 if (af
!= NFPROTO_UNSPEC
)
200 /* Try searching again in the family-independent list */
201 return xt_find_match(NFPROTO_UNSPEC
, name
, revision
);
205 EXPORT_SYMBOL(xt_find_match
);
208 xt_request_find_match(uint8_t nfproto
, const char *name
, uint8_t revision
)
210 struct xt_match
*match
;
212 if (strnlen(name
, XT_EXTENSION_MAXNAMELEN
) == XT_EXTENSION_MAXNAMELEN
)
213 return ERR_PTR(-EINVAL
);
215 match
= xt_find_match(nfproto
, name
, revision
);
217 request_module("%st_%s", xt_prefix
[nfproto
], name
);
218 match
= xt_find_match(nfproto
, name
, revision
);
223 EXPORT_SYMBOL_GPL(xt_request_find_match
);
225 /* Find target, grabs ref. Returns ERR_PTR() on error. */
226 struct xt_target
*xt_find_target(u8 af
, const char *name
, u8 revision
)
231 mutex_lock(&xt
[af
].mutex
);
232 list_for_each_entry(t
, &xt
[af
].target
, list
) {
233 if (strcmp(t
->name
, name
) == 0) {
234 if (t
->revision
== revision
) {
235 if (try_module_get(t
->me
)) {
236 mutex_unlock(&xt
[af
].mutex
);
240 err
= -EPROTOTYPE
; /* Found something. */
243 mutex_unlock(&xt
[af
].mutex
);
245 if (af
!= NFPROTO_UNSPEC
)
246 /* Try searching again in the family-independent list */
247 return xt_find_target(NFPROTO_UNSPEC
, name
, revision
);
251 EXPORT_SYMBOL(xt_find_target
);
253 struct xt_target
*xt_request_find_target(u8 af
, const char *name
, u8 revision
)
255 struct xt_target
*target
;
257 if (strnlen(name
, XT_EXTENSION_MAXNAMELEN
) == XT_EXTENSION_MAXNAMELEN
)
258 return ERR_PTR(-EINVAL
);
260 target
= xt_find_target(af
, name
, revision
);
261 if (IS_ERR(target
)) {
262 request_module("%st_%s", xt_prefix
[af
], name
);
263 target
= xt_find_target(af
, name
, revision
);
268 EXPORT_SYMBOL_GPL(xt_request_find_target
);
271 static int xt_obj_to_user(u16 __user
*psize
, u16 size
,
272 void __user
*pname
, const char *name
,
273 u8 __user
*prev
, u8 rev
)
275 if (put_user(size
, psize
))
277 if (copy_to_user(pname
, name
, strlen(name
) + 1))
279 if (put_user(rev
, prev
))
285 #define XT_OBJ_TO_USER(U, K, TYPE, C_SIZE) \
286 xt_obj_to_user(&U->u.TYPE##_size, C_SIZE ? : K->u.TYPE##_size, \
287 U->u.user.name, K->u.kernel.TYPE->name, \
288 &U->u.user.revision, K->u.kernel.TYPE->revision)
290 int xt_data_to_user(void __user
*dst
, const void *src
,
291 int usersize
, int size
, int aligned_size
)
293 usersize
= usersize
? : size
;
294 if (copy_to_user(dst
, src
, usersize
))
296 if (usersize
!= aligned_size
&&
297 clear_user(dst
+ usersize
, aligned_size
- usersize
))
302 EXPORT_SYMBOL_GPL(xt_data_to_user
);
304 #define XT_DATA_TO_USER(U, K, TYPE) \
305 xt_data_to_user(U->data, K->data, \
306 K->u.kernel.TYPE->usersize, \
307 K->u.kernel.TYPE->TYPE##size, \
308 XT_ALIGN(K->u.kernel.TYPE->TYPE##size))
310 int xt_match_to_user(const struct xt_entry_match
*m
,
311 struct xt_entry_match __user
*u
)
313 return XT_OBJ_TO_USER(u
, m
, match
, 0) ||
314 XT_DATA_TO_USER(u
, m
, match
);
316 EXPORT_SYMBOL_GPL(xt_match_to_user
);
318 int xt_target_to_user(const struct xt_entry_target
*t
,
319 struct xt_entry_target __user
*u
)
321 return XT_OBJ_TO_USER(u
, t
, target
, 0) ||
322 XT_DATA_TO_USER(u
, t
, target
);
324 EXPORT_SYMBOL_GPL(xt_target_to_user
);
326 static int match_revfn(u8 af
, const char *name
, u8 revision
, int *bestp
)
328 const struct xt_match
*m
;
331 list_for_each_entry(m
, &xt
[af
].match
, list
) {
332 if (strcmp(m
->name
, name
) == 0) {
333 if (m
->revision
> *bestp
)
334 *bestp
= m
->revision
;
335 if (m
->revision
== revision
)
340 if (af
!= NFPROTO_UNSPEC
&& !have_rev
)
341 return match_revfn(NFPROTO_UNSPEC
, name
, revision
, bestp
);
346 static int target_revfn(u8 af
, const char *name
, u8 revision
, int *bestp
)
348 const struct xt_target
*t
;
351 list_for_each_entry(t
, &xt
[af
].target
, list
) {
352 if (strcmp(t
->name
, name
) == 0) {
353 if (t
->revision
> *bestp
)
354 *bestp
= t
->revision
;
355 if (t
->revision
== revision
)
360 if (af
!= NFPROTO_UNSPEC
&& !have_rev
)
361 return target_revfn(NFPROTO_UNSPEC
, name
, revision
, bestp
);
366 /* Returns true or false (if no such extension at all) */
367 int xt_find_revision(u8 af
, const char *name
, u8 revision
, int target
,
370 int have_rev
, best
= -1;
372 mutex_lock(&xt
[af
].mutex
);
374 have_rev
= target_revfn(af
, name
, revision
, &best
);
376 have_rev
= match_revfn(af
, name
, revision
, &best
);
377 mutex_unlock(&xt
[af
].mutex
);
379 /* Nothing at all? Return 0 to try loading module. */
387 *err
= -EPROTONOSUPPORT
;
390 EXPORT_SYMBOL_GPL(xt_find_revision
);
393 textify_hooks(char *buf
, size_t size
, unsigned int mask
, uint8_t nfproto
)
395 static const char *const inetbr_names
[] = {
396 "PREROUTING", "INPUT", "FORWARD",
397 "OUTPUT", "POSTROUTING", "BROUTING",
399 static const char *const arp_names
[] = {
400 "INPUT", "FORWARD", "OUTPUT",
402 const char *const *names
;
408 names
= (nfproto
== NFPROTO_ARP
) ? arp_names
: inetbr_names
;
409 max
= (nfproto
== NFPROTO_ARP
) ? ARRAY_SIZE(arp_names
) :
410 ARRAY_SIZE(inetbr_names
);
412 for (i
= 0; i
< max
; ++i
) {
413 if (!(mask
& (1 << i
)))
415 res
= snprintf(p
, size
, "%s%s", np
? "/" : "", names
[i
]);
426 int xt_check_match(struct xt_mtchk_param
*par
,
427 unsigned int size
, u_int8_t proto
, bool inv_proto
)
431 if (XT_ALIGN(par
->match
->matchsize
) != size
&&
432 par
->match
->matchsize
!= -1) {
434 * ebt_among is exempt from centralized matchsize checking
435 * because it uses a dynamic-size data set.
437 pr_err("%s_tables: %s.%u match: invalid size "
438 "%u (kernel) != (user) %u\n",
439 xt_prefix
[par
->family
], par
->match
->name
,
440 par
->match
->revision
,
441 XT_ALIGN(par
->match
->matchsize
), size
);
444 if (par
->match
->table
!= NULL
&&
445 strcmp(par
->match
->table
, par
->table
) != 0) {
446 pr_err("%s_tables: %s match: only valid in %s table, not %s\n",
447 xt_prefix
[par
->family
], par
->match
->name
,
448 par
->match
->table
, par
->table
);
451 if (par
->match
->hooks
&& (par
->hook_mask
& ~par
->match
->hooks
) != 0) {
452 char used
[64], allow
[64];
454 pr_err("%s_tables: %s match: used from hooks %s, but only "
456 xt_prefix
[par
->family
], par
->match
->name
,
457 textify_hooks(used
, sizeof(used
), par
->hook_mask
,
459 textify_hooks(allow
, sizeof(allow
), par
->match
->hooks
,
463 if (par
->match
->proto
&& (par
->match
->proto
!= proto
|| inv_proto
)) {
464 pr_err("%s_tables: %s match: only valid for protocol %u\n",
465 xt_prefix
[par
->family
], par
->match
->name
,
469 if (par
->match
->checkentry
!= NULL
) {
470 ret
= par
->match
->checkentry(par
);
474 /* Flag up potential errors. */
479 EXPORT_SYMBOL_GPL(xt_check_match
);
481 /** xt_check_entry_match - check that matches end before start of target
483 * @match: beginning of xt_entry_match
484 * @target: beginning of this rules target (alleged end of matches)
485 * @alignment: alignment requirement of match structures
487 * Validates that all matches add up to the beginning of the target,
488 * and that each match covers at least the base structure size.
490 * Return: 0 on success, negative errno on failure.
492 static int xt_check_entry_match(const char *match
, const char *target
,
493 const size_t alignment
)
495 const struct xt_entry_match
*pos
;
496 int length
= target
- match
;
498 if (length
== 0) /* no matches */
501 pos
= (struct xt_entry_match
*)match
;
503 if ((unsigned long)pos
% alignment
)
506 if (length
< (int)sizeof(struct xt_entry_match
))
509 if (pos
->u
.match_size
< sizeof(struct xt_entry_match
))
512 if (pos
->u
.match_size
> length
)
515 length
-= pos
->u
.match_size
;
516 pos
= ((void *)((char *)(pos
) + (pos
)->u
.match_size
));
517 } while (length
> 0);
523 int xt_compat_add_offset(u_int8_t af
, unsigned int offset
, int delta
)
525 struct xt_af
*xp
= &xt
[af
];
527 if (!xp
->compat_tab
) {
530 xp
->compat_tab
= vmalloc(sizeof(struct compat_delta
) * xp
->number
);
536 if (xp
->cur
>= xp
->number
)
540 delta
+= xp
->compat_tab
[xp
->cur
- 1].delta
;
541 xp
->compat_tab
[xp
->cur
].offset
= offset
;
542 xp
->compat_tab
[xp
->cur
].delta
= delta
;
546 EXPORT_SYMBOL_GPL(xt_compat_add_offset
);
548 void xt_compat_flush_offsets(u_int8_t af
)
550 if (xt
[af
].compat_tab
) {
551 vfree(xt
[af
].compat_tab
);
552 xt
[af
].compat_tab
= NULL
;
557 EXPORT_SYMBOL_GPL(xt_compat_flush_offsets
);
559 int xt_compat_calc_jump(u_int8_t af
, unsigned int offset
)
561 struct compat_delta
*tmp
= xt
[af
].compat_tab
;
562 int mid
, left
= 0, right
= xt
[af
].cur
- 1;
564 while (left
<= right
) {
565 mid
= (left
+ right
) >> 1;
566 if (offset
> tmp
[mid
].offset
)
568 else if (offset
< tmp
[mid
].offset
)
571 return mid
? tmp
[mid
- 1].delta
: 0;
573 return left
? tmp
[left
- 1].delta
: 0;
575 EXPORT_SYMBOL_GPL(xt_compat_calc_jump
);
577 void xt_compat_init_offsets(u_int8_t af
, unsigned int number
)
579 xt
[af
].number
= number
;
582 EXPORT_SYMBOL(xt_compat_init_offsets
);
584 int xt_compat_match_offset(const struct xt_match
*match
)
586 u_int16_t csize
= match
->compatsize
? : match
->matchsize
;
587 return XT_ALIGN(match
->matchsize
) - COMPAT_XT_ALIGN(csize
);
589 EXPORT_SYMBOL_GPL(xt_compat_match_offset
);
591 void xt_compat_match_from_user(struct xt_entry_match
*m
, void **dstptr
,
594 const struct xt_match
*match
= m
->u
.kernel
.match
;
595 struct compat_xt_entry_match
*cm
= (struct compat_xt_entry_match
*)m
;
596 int pad
, off
= xt_compat_match_offset(match
);
597 u_int16_t msize
= cm
->u
.user
.match_size
;
598 char name
[sizeof(m
->u
.user
.name
)];
601 memcpy(m
, cm
, sizeof(*cm
));
602 if (match
->compat_from_user
)
603 match
->compat_from_user(m
->data
, cm
->data
);
605 memcpy(m
->data
, cm
->data
, msize
- sizeof(*cm
));
606 pad
= XT_ALIGN(match
->matchsize
) - match
->matchsize
;
608 memset(m
->data
+ match
->matchsize
, 0, pad
);
611 m
->u
.user
.match_size
= msize
;
612 strlcpy(name
, match
->name
, sizeof(name
));
613 module_put(match
->me
);
614 strncpy(m
->u
.user
.name
, name
, sizeof(m
->u
.user
.name
));
619 EXPORT_SYMBOL_GPL(xt_compat_match_from_user
);
621 #define COMPAT_XT_DATA_TO_USER(U, K, TYPE, C_SIZE) \
622 xt_data_to_user(U->data, K->data, \
623 K->u.kernel.TYPE->usersize, \
625 COMPAT_XT_ALIGN(C_SIZE))
627 int xt_compat_match_to_user(const struct xt_entry_match
*m
,
628 void __user
**dstptr
, unsigned int *size
)
630 const struct xt_match
*match
= m
->u
.kernel
.match
;
631 struct compat_xt_entry_match __user
*cm
= *dstptr
;
632 int off
= xt_compat_match_offset(match
);
633 u_int16_t msize
= m
->u
.user
.match_size
- off
;
635 if (XT_OBJ_TO_USER(cm
, m
, match
, msize
))
638 if (match
->compat_to_user
) {
639 if (match
->compat_to_user((void __user
*)cm
->data
, m
->data
))
642 if (COMPAT_XT_DATA_TO_USER(cm
, m
, match
, msize
- sizeof(*cm
)))
650 EXPORT_SYMBOL_GPL(xt_compat_match_to_user
);
652 /* non-compat version may have padding after verdict */
653 struct compat_xt_standard_target
{
654 struct compat_xt_entry_target t
;
655 compat_uint_t verdict
;
658 int xt_compat_check_entry_offsets(const void *base
, const char *elems
,
659 unsigned int target_offset
,
660 unsigned int next_offset
)
662 long size_of_base_struct
= elems
- (const char *)base
;
663 const struct compat_xt_entry_target
*t
;
664 const char *e
= base
;
666 if (target_offset
< size_of_base_struct
)
669 if (target_offset
+ sizeof(*t
) > next_offset
)
672 t
= (void *)(e
+ target_offset
);
673 if (t
->u
.target_size
< sizeof(*t
))
676 if (target_offset
+ t
->u
.target_size
> next_offset
)
679 if (strcmp(t
->u
.user
.name
, XT_STANDARD_TARGET
) == 0 &&
680 COMPAT_XT_ALIGN(target_offset
+ sizeof(struct compat_xt_standard_target
)) != next_offset
)
683 /* compat_xt_entry match has less strict alignment requirements,
684 * otherwise they are identical. In case of padding differences
685 * we need to add compat version of xt_check_entry_match.
687 BUILD_BUG_ON(sizeof(struct compat_xt_entry_match
) != sizeof(struct xt_entry_match
));
689 return xt_check_entry_match(elems
, base
+ target_offset
,
690 __alignof__(struct compat_xt_entry_match
));
692 EXPORT_SYMBOL(xt_compat_check_entry_offsets
);
693 #endif /* CONFIG_COMPAT */
696 * xt_check_entry_offsets - validate arp/ip/ip6t_entry
698 * @base: pointer to arp/ip/ip6t_entry
699 * @elems: pointer to first xt_entry_match, i.e. ip(6)t_entry->elems
700 * @target_offset: the arp/ip/ip6_t->target_offset
701 * @next_offset: the arp/ip/ip6_t->next_offset
703 * validates that target_offset and next_offset are sane and that all
704 * match sizes (if any) align with the target offset.
706 * This function does not validate the targets or matches themselves, it
707 * only tests that all the offsets and sizes are correct, that all
708 * match structures are aligned, and that the last structure ends where
709 * the target structure begins.
711 * Also see xt_compat_check_entry_offsets for CONFIG_COMPAT version.
713 * The arp/ip/ip6t_entry structure @base must have passed following tests:
714 * - it must point to a valid memory location
715 * - base to base + next_offset must be accessible, i.e. not exceed allocated
718 * A well-formed entry looks like this:
720 * ip(6)t_entry match [mtdata] match [mtdata] target [tgdata] ip(6)t_entry
721 * e->elems[]-----' | |
725 * target_offset---------------------------------' |
726 * next_offset---------------------------------------------------'
728 * elems[]: flexible array member at end of ip(6)/arpt_entry struct.
729 * This is where matches (if any) and the target reside.
730 * target_offset: beginning of target.
731 * next_offset: start of the next rule; also: size of this rule.
732 * Since targets have a minimum size, target_offset + minlen <= next_offset.
734 * Every match stores its size, sum of sizes must not exceed target_offset.
736 * Return: 0 on success, negative errno on failure.
738 int xt_check_entry_offsets(const void *base
,
740 unsigned int target_offset
,
741 unsigned int next_offset
)
743 long size_of_base_struct
= elems
- (const char *)base
;
744 const struct xt_entry_target
*t
;
745 const char *e
= base
;
747 /* target start is within the ip/ip6/arpt_entry struct */
748 if (target_offset
< size_of_base_struct
)
751 if (target_offset
+ sizeof(*t
) > next_offset
)
754 t
= (void *)(e
+ target_offset
);
755 if (t
->u
.target_size
< sizeof(*t
))
758 if (target_offset
+ t
->u
.target_size
> next_offset
)
761 if (strcmp(t
->u
.user
.name
, XT_STANDARD_TARGET
) == 0 &&
762 XT_ALIGN(target_offset
+ sizeof(struct xt_standard_target
)) != next_offset
)
765 return xt_check_entry_match(elems
, base
+ target_offset
,
766 __alignof__(struct xt_entry_match
));
768 EXPORT_SYMBOL(xt_check_entry_offsets
);
771 * xt_alloc_entry_offsets - allocate array to store rule head offsets
773 * @size: number of entries
775 * Return: NULL or kmalloc'd or vmalloc'd array
777 unsigned int *xt_alloc_entry_offsets(unsigned int size
)
779 return kvmalloc_array(size
, sizeof(unsigned int), GFP_KERNEL
| __GFP_ZERO
);
782 EXPORT_SYMBOL(xt_alloc_entry_offsets
);
785 * xt_find_jump_offset - check if target is a valid jump offset
787 * @offsets: array containing all valid rule start offsets of a rule blob
788 * @target: the jump target to search for
789 * @size: entries in @offset
791 bool xt_find_jump_offset(const unsigned int *offsets
,
792 unsigned int target
, unsigned int size
)
794 int m
, low
= 0, hi
= size
;
799 if (offsets
[m
] > target
)
801 else if (offsets
[m
] < target
)
809 EXPORT_SYMBOL(xt_find_jump_offset
);
811 int xt_check_target(struct xt_tgchk_param
*par
,
812 unsigned int size
, u_int8_t proto
, bool inv_proto
)
816 if (XT_ALIGN(par
->target
->targetsize
) != size
) {
817 pr_err("%s_tables: %s.%u target: invalid size "
818 "%u (kernel) != (user) %u\n",
819 xt_prefix
[par
->family
], par
->target
->name
,
820 par
->target
->revision
,
821 XT_ALIGN(par
->target
->targetsize
), size
);
824 if (par
->target
->table
!= NULL
&&
825 strcmp(par
->target
->table
, par
->table
) != 0) {
826 pr_err("%s_tables: %s target: only valid in %s table, not %s\n",
827 xt_prefix
[par
->family
], par
->target
->name
,
828 par
->target
->table
, par
->table
);
831 if (par
->target
->hooks
&& (par
->hook_mask
& ~par
->target
->hooks
) != 0) {
832 char used
[64], allow
[64];
834 pr_err("%s_tables: %s target: used from hooks %s, but only "
836 xt_prefix
[par
->family
], par
->target
->name
,
837 textify_hooks(used
, sizeof(used
), par
->hook_mask
,
839 textify_hooks(allow
, sizeof(allow
), par
->target
->hooks
,
843 if (par
->target
->proto
&& (par
->target
->proto
!= proto
|| inv_proto
)) {
844 pr_err("%s_tables: %s target: only valid for protocol %u\n",
845 xt_prefix
[par
->family
], par
->target
->name
,
849 if (par
->target
->checkentry
!= NULL
) {
850 ret
= par
->target
->checkentry(par
);
854 /* Flag up potential errors. */
859 EXPORT_SYMBOL_GPL(xt_check_target
);
862 * xt_copy_counters_from_user - copy counters and metadata from userspace
864 * @user: src pointer to userspace memory
865 * @len: alleged size of userspace memory
866 * @info: where to store the xt_counters_info metadata
867 * @compat: true if we setsockopt call is done by 32bit task on 64bit kernel
869 * Copies counter meta data from @user and stores it in @info.
871 * vmallocs memory to hold the counters, then copies the counter data
872 * from @user to the new memory and returns a pointer to it.
874 * If @compat is true, @info gets converted automatically to the 64bit
877 * The metadata associated with the counters is stored in @info.
879 * Return: returns pointer that caller has to test via IS_ERR().
880 * If IS_ERR is false, caller has to vfree the pointer.
882 void *xt_copy_counters_from_user(const void __user
*user
, unsigned int len
,
883 struct xt_counters_info
*info
, bool compat
)
890 /* structures only differ in size due to alignment */
891 struct compat_xt_counters_info compat_tmp
;
893 if (len
<= sizeof(compat_tmp
))
894 return ERR_PTR(-EINVAL
);
896 len
-= sizeof(compat_tmp
);
897 if (copy_from_user(&compat_tmp
, user
, sizeof(compat_tmp
)) != 0)
898 return ERR_PTR(-EFAULT
);
900 memcpy(info
->name
, compat_tmp
.name
, sizeof(info
->name
) - 1);
901 info
->num_counters
= compat_tmp
.num_counters
;
902 user
+= sizeof(compat_tmp
);
906 if (len
<= sizeof(*info
))
907 return ERR_PTR(-EINVAL
);
909 len
-= sizeof(*info
);
910 if (copy_from_user(info
, user
, sizeof(*info
)) != 0)
911 return ERR_PTR(-EFAULT
);
913 user
+= sizeof(*info
);
915 info
->name
[sizeof(info
->name
) - 1] = '\0';
917 size
= sizeof(struct xt_counters
);
918 size
*= info
->num_counters
;
920 if (size
!= (u64
)len
)
921 return ERR_PTR(-EINVAL
);
925 return ERR_PTR(-ENOMEM
);
927 if (copy_from_user(mem
, user
, len
) == 0)
931 return ERR_PTR(-EFAULT
);
933 EXPORT_SYMBOL_GPL(xt_copy_counters_from_user
);
936 int xt_compat_target_offset(const struct xt_target
*target
)
938 u_int16_t csize
= target
->compatsize
? : target
->targetsize
;
939 return XT_ALIGN(target
->targetsize
) - COMPAT_XT_ALIGN(csize
);
941 EXPORT_SYMBOL_GPL(xt_compat_target_offset
);
943 void xt_compat_target_from_user(struct xt_entry_target
*t
, void **dstptr
,
946 const struct xt_target
*target
= t
->u
.kernel
.target
;
947 struct compat_xt_entry_target
*ct
= (struct compat_xt_entry_target
*)t
;
948 int pad
, off
= xt_compat_target_offset(target
);
949 u_int16_t tsize
= ct
->u
.user
.target_size
;
950 char name
[sizeof(t
->u
.user
.name
)];
953 memcpy(t
, ct
, sizeof(*ct
));
954 if (target
->compat_from_user
)
955 target
->compat_from_user(t
->data
, ct
->data
);
957 memcpy(t
->data
, ct
->data
, tsize
- sizeof(*ct
));
958 pad
= XT_ALIGN(target
->targetsize
) - target
->targetsize
;
960 memset(t
->data
+ target
->targetsize
, 0, pad
);
963 t
->u
.user
.target_size
= tsize
;
964 strlcpy(name
, target
->name
, sizeof(name
));
965 module_put(target
->me
);
966 strncpy(t
->u
.user
.name
, name
, sizeof(t
->u
.user
.name
));
971 EXPORT_SYMBOL_GPL(xt_compat_target_from_user
);
973 int xt_compat_target_to_user(const struct xt_entry_target
*t
,
974 void __user
**dstptr
, unsigned int *size
)
976 const struct xt_target
*target
= t
->u
.kernel
.target
;
977 struct compat_xt_entry_target __user
*ct
= *dstptr
;
978 int off
= xt_compat_target_offset(target
);
979 u_int16_t tsize
= t
->u
.user
.target_size
- off
;
981 if (XT_OBJ_TO_USER(ct
, t
, target
, tsize
))
984 if (target
->compat_to_user
) {
985 if (target
->compat_to_user((void __user
*)ct
->data
, t
->data
))
988 if (COMPAT_XT_DATA_TO_USER(ct
, t
, target
, tsize
- sizeof(*ct
)))
996 EXPORT_SYMBOL_GPL(xt_compat_target_to_user
);
999 struct xt_table_info
*xt_alloc_table_info(unsigned int size
)
1001 struct xt_table_info
*info
= NULL
;
1002 size_t sz
= sizeof(*info
) + size
;
1004 if (sz
< sizeof(*info
))
1007 /* Pedantry: prevent them from hitting BUG() in vmalloc.c --RR */
1008 if ((size
>> PAGE_SHIFT
) + 2 > totalram_pages
)
1011 /* __GFP_NORETRY is not fully supported by kvmalloc but it should
1012 * work reasonably well if sz is too large and bail out rather
1013 * than shoot all processes down before realizing there is nothing
1016 info
= kvmalloc(sz
, GFP_KERNEL
| __GFP_NORETRY
);
1020 memset(info
, 0, sizeof(*info
));
1024 EXPORT_SYMBOL(xt_alloc_table_info
);
1026 void xt_free_table_info(struct xt_table_info
*info
)
1030 if (info
->jumpstack
!= NULL
) {
1031 for_each_possible_cpu(cpu
)
1032 kvfree(info
->jumpstack
[cpu
]);
1033 kvfree(info
->jumpstack
);
1038 EXPORT_SYMBOL(xt_free_table_info
);
1040 /* Find table by name, grabs mutex & ref. Returns ERR_PTR on error. */
1041 struct xt_table
*xt_find_table_lock(struct net
*net
, u_int8_t af
,
1044 struct xt_table
*t
, *found
= NULL
;
1046 mutex_lock(&xt
[af
].mutex
);
1047 list_for_each_entry(t
, &net
->xt
.tables
[af
], list
)
1048 if (strcmp(t
->name
, name
) == 0 && try_module_get(t
->me
))
1051 if (net
== &init_net
)
1054 /* Table doesn't exist in this netns, re-try init */
1055 list_for_each_entry(t
, &init_net
.xt
.tables
[af
], list
) {
1058 if (strcmp(t
->name
, name
))
1060 if (!try_module_get(t
->me
))
1062 mutex_unlock(&xt
[af
].mutex
);
1063 err
= t
->table_init(net
);
1066 return ERR_PTR(err
);
1071 mutex_lock(&xt
[af
].mutex
);
1078 /* and once again: */
1079 list_for_each_entry(t
, &net
->xt
.tables
[af
], list
)
1080 if (strcmp(t
->name
, name
) == 0)
1083 module_put(found
->me
);
1085 mutex_unlock(&xt
[af
].mutex
);
1086 return ERR_PTR(-ENOENT
);
1088 EXPORT_SYMBOL_GPL(xt_find_table_lock
);
1090 struct xt_table
*xt_request_find_table_lock(struct net
*net
, u_int8_t af
,
1093 struct xt_table
*t
= xt_find_table_lock(net
, af
, name
);
1095 #ifdef CONFIG_MODULES
1097 int err
= request_module("%stable_%s", xt_prefix
[af
], name
);
1099 return ERR_PTR(err
);
1100 t
= xt_find_table_lock(net
, af
, name
);
1106 EXPORT_SYMBOL_GPL(xt_request_find_table_lock
);
1108 void xt_table_unlock(struct xt_table
*table
)
1110 mutex_unlock(&xt
[table
->af
].mutex
);
1112 EXPORT_SYMBOL_GPL(xt_table_unlock
);
1114 #ifdef CONFIG_COMPAT
1115 void xt_compat_lock(u_int8_t af
)
1117 mutex_lock(&xt
[af
].compat_mutex
);
1119 EXPORT_SYMBOL_GPL(xt_compat_lock
);
1121 void xt_compat_unlock(u_int8_t af
)
1123 mutex_unlock(&xt
[af
].compat_mutex
);
1125 EXPORT_SYMBOL_GPL(xt_compat_unlock
);
1128 DEFINE_PER_CPU(seqcount_t
, xt_recseq
);
1129 EXPORT_PER_CPU_SYMBOL_GPL(xt_recseq
);
1131 struct static_key xt_tee_enabled __read_mostly
;
1132 EXPORT_SYMBOL_GPL(xt_tee_enabled
);
1134 static int xt_jumpstack_alloc(struct xt_table_info
*i
)
1139 size
= sizeof(void **) * nr_cpu_ids
;
1140 if (size
> PAGE_SIZE
)
1141 i
->jumpstack
= kvzalloc(size
, GFP_KERNEL
);
1143 i
->jumpstack
= kzalloc(size
, GFP_KERNEL
);
1144 if (i
->jumpstack
== NULL
)
1147 /* ruleset without jumps -- no stack needed */
1148 if (i
->stacksize
== 0)
1151 /* Jumpstack needs to be able to record two full callchains, one
1152 * from the first rule set traversal, plus one table reentrancy
1153 * via -j TEE without clobbering the callchain that brought us to
1156 * This is done by allocating two jumpstacks per cpu, on reentry
1157 * the upper half of the stack is used.
1159 * see the jumpstack setup in ipt_do_table() for more details.
1161 size
= sizeof(void *) * i
->stacksize
* 2u;
1162 for_each_possible_cpu(cpu
) {
1163 i
->jumpstack
[cpu
] = kvmalloc_node(size
, GFP_KERNEL
,
1165 if (i
->jumpstack
[cpu
] == NULL
)
1167 * Freeing will be done later on by the callers. The
1168 * chain is: xt_replace_table -> __do_replace ->
1169 * do_replace -> xt_free_table_info.
1177 struct xt_table_info
*
1178 xt_replace_table(struct xt_table
*table
,
1179 unsigned int num_counters
,
1180 struct xt_table_info
*newinfo
,
1183 struct xt_table_info
*private;
1187 ret
= xt_jumpstack_alloc(newinfo
);
1193 /* Do the substitution. */
1195 private = table
->private;
1197 /* Check inside lock: is the old number correct? */
1198 if (num_counters
!= private->number
) {
1199 pr_debug("num_counters != table->private->number (%u/%u)\n",
1200 num_counters
, private->number
);
1206 newinfo
->initial_entries
= private->initial_entries
;
1208 * Ensure contents of newinfo are visible before assigning to
1212 table
->private = newinfo
;
1214 /* make sure all cpus see new ->private value */
1218 * Even though table entries have now been swapped, other CPU's
1219 * may still be using the old entries...
1223 /* ... so wait for even xt_recseq on all cpus */
1224 for_each_possible_cpu(cpu
) {
1225 seqcount_t
*s
= &per_cpu(xt_recseq
, cpu
);
1226 u32 seq
= raw_read_seqcount(s
);
1232 } while (seq
== raw_read_seqcount(s
));
1237 if (audit_enabled
) {
1238 audit_log(current
->audit_context
, GFP_KERNEL
,
1239 AUDIT_NETFILTER_CFG
,
1240 "table=%s family=%u entries=%u",
1241 table
->name
, table
->af
, private->number
);
1247 EXPORT_SYMBOL_GPL(xt_replace_table
);
1249 struct xt_table
*xt_register_table(struct net
*net
,
1250 const struct xt_table
*input_table
,
1251 struct xt_table_info
*bootstrap
,
1252 struct xt_table_info
*newinfo
)
1255 struct xt_table_info
*private;
1256 struct xt_table
*t
, *table
;
1258 /* Don't add one object to multiple lists. */
1259 table
= kmemdup(input_table
, sizeof(struct xt_table
), GFP_KERNEL
);
1265 mutex_lock(&xt
[table
->af
].mutex
);
1266 /* Don't autoload: we'd eat our tail... */
1267 list_for_each_entry(t
, &net
->xt
.tables
[table
->af
], list
) {
1268 if (strcmp(t
->name
, table
->name
) == 0) {
1274 /* Simplifies replace_table code. */
1275 table
->private = bootstrap
;
1277 if (!xt_replace_table(table
, 0, newinfo
, &ret
))
1280 private = table
->private;
1281 pr_debug("table->private->number = %u\n", private->number
);
1283 /* save number of initial entries */
1284 private->initial_entries
= private->number
;
1286 list_add(&table
->list
, &net
->xt
.tables
[table
->af
]);
1287 mutex_unlock(&xt
[table
->af
].mutex
);
1291 mutex_unlock(&xt
[table
->af
].mutex
);
1294 return ERR_PTR(ret
);
1296 EXPORT_SYMBOL_GPL(xt_register_table
);
1298 void *xt_unregister_table(struct xt_table
*table
)
1300 struct xt_table_info
*private;
1302 mutex_lock(&xt
[table
->af
].mutex
);
1303 private = table
->private;
1304 list_del(&table
->list
);
1305 mutex_unlock(&xt
[table
->af
].mutex
);
1310 EXPORT_SYMBOL_GPL(xt_unregister_table
);
1312 #ifdef CONFIG_PROC_FS
1313 struct xt_names_priv
{
1314 struct seq_net_private p
;
1317 static void *xt_table_seq_start(struct seq_file
*seq
, loff_t
*pos
)
1319 struct xt_names_priv
*priv
= seq
->private;
1320 struct net
*net
= seq_file_net(seq
);
1321 u_int8_t af
= priv
->af
;
1323 mutex_lock(&xt
[af
].mutex
);
1324 return seq_list_start(&net
->xt
.tables
[af
], *pos
);
1327 static void *xt_table_seq_next(struct seq_file
*seq
, void *v
, loff_t
*pos
)
1329 struct xt_names_priv
*priv
= seq
->private;
1330 struct net
*net
= seq_file_net(seq
);
1331 u_int8_t af
= priv
->af
;
1333 return seq_list_next(v
, &net
->xt
.tables
[af
], pos
);
1336 static void xt_table_seq_stop(struct seq_file
*seq
, void *v
)
1338 struct xt_names_priv
*priv
= seq
->private;
1339 u_int8_t af
= priv
->af
;
1341 mutex_unlock(&xt
[af
].mutex
);
1344 static int xt_table_seq_show(struct seq_file
*seq
, void *v
)
1346 struct xt_table
*table
= list_entry(v
, struct xt_table
, list
);
1349 seq_printf(seq
, "%s\n", table
->name
);
1353 static const struct seq_operations xt_table_seq_ops
= {
1354 .start
= xt_table_seq_start
,
1355 .next
= xt_table_seq_next
,
1356 .stop
= xt_table_seq_stop
,
1357 .show
= xt_table_seq_show
,
1360 static int xt_table_open(struct inode
*inode
, struct file
*file
)
1363 struct xt_names_priv
*priv
;
1365 ret
= seq_open_net(inode
, file
, &xt_table_seq_ops
,
1366 sizeof(struct xt_names_priv
));
1368 priv
= ((struct seq_file
*)file
->private_data
)->private;
1369 priv
->af
= (unsigned long)PDE_DATA(inode
);
1374 static const struct file_operations xt_table_ops
= {
1375 .open
= xt_table_open
,
1377 .llseek
= seq_lseek
,
1378 .release
= seq_release_net
,
1382 * Traverse state for ip{,6}_{tables,matches} for helping crossing
1383 * the multi-AF mutexes.
1385 struct nf_mttg_trav
{
1386 struct list_head
*head
, *curr
;
1387 uint8_t class, nfproto
;
1392 MTTG_TRAV_NFP_UNSPEC
,
1397 static void *xt_mttg_seq_next(struct seq_file
*seq
, void *v
, loff_t
*ppos
,
1400 static const uint8_t next_class
[] = {
1401 [MTTG_TRAV_NFP_UNSPEC
] = MTTG_TRAV_NFP_SPEC
,
1402 [MTTG_TRAV_NFP_SPEC
] = MTTG_TRAV_DONE
,
1404 struct nf_mttg_trav
*trav
= seq
->private;
1406 switch (trav
->class) {
1407 case MTTG_TRAV_INIT
:
1408 trav
->class = MTTG_TRAV_NFP_UNSPEC
;
1409 mutex_lock(&xt
[NFPROTO_UNSPEC
].mutex
);
1410 trav
->head
= trav
->curr
= is_target
?
1411 &xt
[NFPROTO_UNSPEC
].target
: &xt
[NFPROTO_UNSPEC
].match
;
1413 case MTTG_TRAV_NFP_UNSPEC
:
1414 trav
->curr
= trav
->curr
->next
;
1415 if (trav
->curr
!= trav
->head
)
1417 mutex_unlock(&xt
[NFPROTO_UNSPEC
].mutex
);
1418 mutex_lock(&xt
[trav
->nfproto
].mutex
);
1419 trav
->head
= trav
->curr
= is_target
?
1420 &xt
[trav
->nfproto
].target
: &xt
[trav
->nfproto
].match
;
1421 trav
->class = next_class
[trav
->class];
1423 case MTTG_TRAV_NFP_SPEC
:
1424 trav
->curr
= trav
->curr
->next
;
1425 if (trav
->curr
!= trav
->head
)
1437 static void *xt_mttg_seq_start(struct seq_file
*seq
, loff_t
*pos
,
1440 struct nf_mttg_trav
*trav
= seq
->private;
1443 trav
->class = MTTG_TRAV_INIT
;
1444 for (j
= 0; j
< *pos
; ++j
)
1445 if (xt_mttg_seq_next(seq
, NULL
, NULL
, is_target
) == NULL
)
1450 static void xt_mttg_seq_stop(struct seq_file
*seq
, void *v
)
1452 struct nf_mttg_trav
*trav
= seq
->private;
1454 switch (trav
->class) {
1455 case MTTG_TRAV_NFP_UNSPEC
:
1456 mutex_unlock(&xt
[NFPROTO_UNSPEC
].mutex
);
1458 case MTTG_TRAV_NFP_SPEC
:
1459 mutex_unlock(&xt
[trav
->nfproto
].mutex
);
1464 static void *xt_match_seq_start(struct seq_file
*seq
, loff_t
*pos
)
1466 return xt_mttg_seq_start(seq
, pos
, false);
1469 static void *xt_match_seq_next(struct seq_file
*seq
, void *v
, loff_t
*ppos
)
1471 return xt_mttg_seq_next(seq
, v
, ppos
, false);
1474 static int xt_match_seq_show(struct seq_file
*seq
, void *v
)
1476 const struct nf_mttg_trav
*trav
= seq
->private;
1477 const struct xt_match
*match
;
1479 switch (trav
->class) {
1480 case MTTG_TRAV_NFP_UNSPEC
:
1481 case MTTG_TRAV_NFP_SPEC
:
1482 if (trav
->curr
== trav
->head
)
1484 match
= list_entry(trav
->curr
, struct xt_match
, list
);
1486 seq_printf(seq
, "%s\n", match
->name
);
1491 static const struct seq_operations xt_match_seq_ops
= {
1492 .start
= xt_match_seq_start
,
1493 .next
= xt_match_seq_next
,
1494 .stop
= xt_mttg_seq_stop
,
1495 .show
= xt_match_seq_show
,
1498 static int xt_match_open(struct inode
*inode
, struct file
*file
)
1500 struct nf_mttg_trav
*trav
;
1501 trav
= __seq_open_private(file
, &xt_match_seq_ops
, sizeof(*trav
));
1505 trav
->nfproto
= (unsigned long)PDE_DATA(inode
);
1509 static const struct file_operations xt_match_ops
= {
1510 .open
= xt_match_open
,
1512 .llseek
= seq_lseek
,
1513 .release
= seq_release_private
,
1516 static void *xt_target_seq_start(struct seq_file
*seq
, loff_t
*pos
)
1518 return xt_mttg_seq_start(seq
, pos
, true);
1521 static void *xt_target_seq_next(struct seq_file
*seq
, void *v
, loff_t
*ppos
)
1523 return xt_mttg_seq_next(seq
, v
, ppos
, true);
1526 static int xt_target_seq_show(struct seq_file
*seq
, void *v
)
1528 const struct nf_mttg_trav
*trav
= seq
->private;
1529 const struct xt_target
*target
;
1531 switch (trav
->class) {
1532 case MTTG_TRAV_NFP_UNSPEC
:
1533 case MTTG_TRAV_NFP_SPEC
:
1534 if (trav
->curr
== trav
->head
)
1536 target
= list_entry(trav
->curr
, struct xt_target
, list
);
1538 seq_printf(seq
, "%s\n", target
->name
);
1543 static const struct seq_operations xt_target_seq_ops
= {
1544 .start
= xt_target_seq_start
,
1545 .next
= xt_target_seq_next
,
1546 .stop
= xt_mttg_seq_stop
,
1547 .show
= xt_target_seq_show
,
1550 static int xt_target_open(struct inode
*inode
, struct file
*file
)
1552 struct nf_mttg_trav
*trav
;
1553 trav
= __seq_open_private(file
, &xt_target_seq_ops
, sizeof(*trav
));
1557 trav
->nfproto
= (unsigned long)PDE_DATA(inode
);
1561 static const struct file_operations xt_target_ops
= {
1562 .open
= xt_target_open
,
1564 .llseek
= seq_lseek
,
1565 .release
= seq_release_private
,
1568 #define FORMAT_TABLES "_tables_names"
1569 #define FORMAT_MATCHES "_tables_matches"
1570 #define FORMAT_TARGETS "_tables_targets"
1572 #endif /* CONFIG_PROC_FS */
1575 * xt_hook_ops_alloc - set up hooks for a new table
1576 * @table: table with metadata needed to set up hooks
1577 * @fn: Hook function
1579 * This function will create the nf_hook_ops that the x_table needs
1580 * to hand to xt_hook_link_net().
1582 struct nf_hook_ops
*
1583 xt_hook_ops_alloc(const struct xt_table
*table
, nf_hookfn
*fn
)
1585 unsigned int hook_mask
= table
->valid_hooks
;
1586 uint8_t i
, num_hooks
= hweight32(hook_mask
);
1588 struct nf_hook_ops
*ops
;
1591 return ERR_PTR(-EINVAL
);
1593 ops
= kcalloc(num_hooks
, sizeof(*ops
), GFP_KERNEL
);
1595 return ERR_PTR(-ENOMEM
);
1597 for (i
= 0, hooknum
= 0; i
< num_hooks
&& hook_mask
!= 0;
1598 hook_mask
>>= 1, ++hooknum
) {
1599 if (!(hook_mask
& 1))
1602 ops
[i
].pf
= table
->af
;
1603 ops
[i
].hooknum
= hooknum
;
1604 ops
[i
].priority
= table
->priority
;
1610 EXPORT_SYMBOL_GPL(xt_hook_ops_alloc
);
1612 int xt_proto_init(struct net
*net
, u_int8_t af
)
1614 #ifdef CONFIG_PROC_FS
1615 char buf
[XT_FUNCTION_MAXNAMELEN
];
1616 struct proc_dir_entry
*proc
;
1621 if (af
>= ARRAY_SIZE(xt_prefix
))
1625 #ifdef CONFIG_PROC_FS
1626 root_uid
= make_kuid(net
->user_ns
, 0);
1627 root_gid
= make_kgid(net
->user_ns
, 0);
1629 strlcpy(buf
, xt_prefix
[af
], sizeof(buf
));
1630 strlcat(buf
, FORMAT_TABLES
, sizeof(buf
));
1631 proc
= proc_create_data(buf
, 0440, net
->proc_net
, &xt_table_ops
,
1632 (void *)(unsigned long)af
);
1635 if (uid_valid(root_uid
) && gid_valid(root_gid
))
1636 proc_set_user(proc
, root_uid
, root_gid
);
1638 strlcpy(buf
, xt_prefix
[af
], sizeof(buf
));
1639 strlcat(buf
, FORMAT_MATCHES
, sizeof(buf
));
1640 proc
= proc_create_data(buf
, 0440, net
->proc_net
, &xt_match_ops
,
1641 (void *)(unsigned long)af
);
1643 goto out_remove_tables
;
1644 if (uid_valid(root_uid
) && gid_valid(root_gid
))
1645 proc_set_user(proc
, root_uid
, root_gid
);
1647 strlcpy(buf
, xt_prefix
[af
], sizeof(buf
));
1648 strlcat(buf
, FORMAT_TARGETS
, sizeof(buf
));
1649 proc
= proc_create_data(buf
, 0440, net
->proc_net
, &xt_target_ops
,
1650 (void *)(unsigned long)af
);
1652 goto out_remove_matches
;
1653 if (uid_valid(root_uid
) && gid_valid(root_gid
))
1654 proc_set_user(proc
, root_uid
, root_gid
);
1659 #ifdef CONFIG_PROC_FS
1661 strlcpy(buf
, xt_prefix
[af
], sizeof(buf
));
1662 strlcat(buf
, FORMAT_MATCHES
, sizeof(buf
));
1663 remove_proc_entry(buf
, net
->proc_net
);
1666 strlcpy(buf
, xt_prefix
[af
], sizeof(buf
));
1667 strlcat(buf
, FORMAT_TABLES
, sizeof(buf
));
1668 remove_proc_entry(buf
, net
->proc_net
);
1673 EXPORT_SYMBOL_GPL(xt_proto_init
);
1675 void xt_proto_fini(struct net
*net
, u_int8_t af
)
1677 #ifdef CONFIG_PROC_FS
1678 char buf
[XT_FUNCTION_MAXNAMELEN
];
1680 strlcpy(buf
, xt_prefix
[af
], sizeof(buf
));
1681 strlcat(buf
, FORMAT_TABLES
, sizeof(buf
));
1682 remove_proc_entry(buf
, net
->proc_net
);
1684 strlcpy(buf
, xt_prefix
[af
], sizeof(buf
));
1685 strlcat(buf
, FORMAT_TARGETS
, sizeof(buf
));
1686 remove_proc_entry(buf
, net
->proc_net
);
1688 strlcpy(buf
, xt_prefix
[af
], sizeof(buf
));
1689 strlcat(buf
, FORMAT_MATCHES
, sizeof(buf
));
1690 remove_proc_entry(buf
, net
->proc_net
);
1691 #endif /*CONFIG_PROC_FS*/
1693 EXPORT_SYMBOL_GPL(xt_proto_fini
);
1696 * xt_percpu_counter_alloc - allocate x_tables rule counter
1698 * @state: pointer to xt_percpu allocation state
1699 * @counter: pointer to counter struct inside the ip(6)/arpt_entry struct
1701 * On SMP, the packet counter [ ip(6)t_entry->counters.pcnt ] will then
1702 * contain the address of the real (percpu) counter.
1704 * Rule evaluation needs to use xt_get_this_cpu_counter() helper
1705 * to fetch the real percpu counter.
1707 * To speed up allocation and improve data locality, a 4kb block is
1710 * xt_percpu_counter_alloc_state contains the base address of the
1711 * allocated page and the current sub-offset.
1713 * returns false on error.
1715 bool xt_percpu_counter_alloc(struct xt_percpu_counter_alloc_state
*state
,
1716 struct xt_counters
*counter
)
1718 BUILD_BUG_ON(XT_PCPU_BLOCK_SIZE
< (sizeof(*counter
) * 2));
1720 if (nr_cpu_ids
<= 1)
1724 state
->mem
= __alloc_percpu(XT_PCPU_BLOCK_SIZE
,
1725 XT_PCPU_BLOCK_SIZE
);
1729 counter
->pcnt
= (__force
unsigned long)(state
->mem
+ state
->off
);
1730 state
->off
+= sizeof(*counter
);
1731 if (state
->off
> (XT_PCPU_BLOCK_SIZE
- sizeof(*counter
))) {
1737 EXPORT_SYMBOL_GPL(xt_percpu_counter_alloc
);
1739 void xt_percpu_counter_free(struct xt_counters
*counters
)
1741 unsigned long pcnt
= counters
->pcnt
;
1743 if (nr_cpu_ids
> 1 && (pcnt
& (XT_PCPU_BLOCK_SIZE
- 1)) == 0)
1744 free_percpu((void __percpu
*)pcnt
);
1746 EXPORT_SYMBOL_GPL(xt_percpu_counter_free
);
1748 static int __net_init
xt_net_init(struct net
*net
)
1752 for (i
= 0; i
< NFPROTO_NUMPROTO
; i
++)
1753 INIT_LIST_HEAD(&net
->xt
.tables
[i
]);
1757 static void __net_exit
xt_net_exit(struct net
*net
)
1761 for (i
= 0; i
< NFPROTO_NUMPROTO
; i
++)
1762 WARN_ON_ONCE(!list_empty(&net
->xt
.tables
[i
]));
1765 static struct pernet_operations xt_net_ops
= {
1766 .init
= xt_net_init
,
1767 .exit
= xt_net_exit
,
1770 static int __init
xt_init(void)
1775 for_each_possible_cpu(i
) {
1776 seqcount_init(&per_cpu(xt_recseq
, i
));
1779 xt
= kmalloc(sizeof(struct xt_af
) * NFPROTO_NUMPROTO
, GFP_KERNEL
);
1783 for (i
= 0; i
< NFPROTO_NUMPROTO
; i
++) {
1784 mutex_init(&xt
[i
].mutex
);
1785 #ifdef CONFIG_COMPAT
1786 mutex_init(&xt
[i
].compat_mutex
);
1787 xt
[i
].compat_tab
= NULL
;
1789 INIT_LIST_HEAD(&xt
[i
].target
);
1790 INIT_LIST_HEAD(&xt
[i
].match
);
1792 rv
= register_pernet_subsys(&xt_net_ops
);
1798 static void __exit
xt_fini(void)
1800 unregister_pernet_subsys(&xt_net_ops
);
1804 module_init(xt_init
);
1805 module_exit(xt_fini
);